parserPDF / llm /llm_login.py
semmyk's picture
baseline08_beta0.3.0_01Oct25: refactor oauth log in, - Marker converter, dropped llm_client, - add force_ocr: to phase in cli-option
8290881
raw
history blame
5.04 kB
from huggingface_hub import HfApi, login, logout, get_token, whoami
import os
import traceback
from time import sleep
from typing import Optional
from utils.logger import get_logger
from ui.gradio_ui import gr
## Get logger instance
logger = get_logger(__name__)
def disable_immplicit_token():
# Disable implicit token propagation for determinism
# Explicitly disable implicit token propagation; we rely on explicit auth or env var
os.environ["HF_HUB_DISABLE_IMPLICIT_TOKEN"] = "1"
#def get_login_token( api_token_arg, oauth_token: gr.OAuthToken | None=None,):
def get_login_token( api_token_arg, oauth_token):
""" Use user's supplied token or Get token from logged-in users, else from token stored on the machine. Return token"""
#oauth_token = get_token() if oauth_token is not None else api_token_arg
if api_token_arg != '': # or not None: #| None:
oauth_token = api_token_arg
elif oauth_token:
oauth_token = oauth_token.token
else: oauth_token = '' if not get_token() else get_token()
#return str(oauth_token) if oauth_token else '' ##token value or empty string
return oauth_token if oauth_token else '' ##token value or empty string
def login_huggingface(token: Optional[str] = None):
"""
Login to Hugging Face account. Prioritize CLI login for privacy and determinism.
Attempts to log in to Hugging Face Hub.
First, it tries to log in interactively via the Hugging Face CLI.
If that fails, it falls back to using a token provided as an argument or
found in the environment variables HF_TOKEN or HUGGINGFACEHUB_API_TOKEN.
If both methods fail, it logs a warning and continues without logging in.
"""
logger.info("Attempting Hugging Face login...")
# Disable implicit token propagation for determinism
# Explicitly disable implicit token propagation; we rely on explicit auth or env var
#os.environ["HF_HUB_DISABLE_IMPLICIT_TOKEN"] = "1"
disable_immplicit_token()
token = token
# Privacy-first login: try interactive CLI first; fallback to provided/env token only if needed
try:
#if HfApi.whoami(): ##SMY requires 'self' = HfApi. Alternatively HfApi().whoami()
if whoami(): ##SMY: Call HF API to know "whoami".
logger.info("βœ”οΈ hf_login already: whoami()", extra={"mode": "HF Oauth"})
#return True
else:
login() ##SMY: Not visible/interactive to users on HF Space. ## ProcessPoll limitation
sleep(5) ##SMY pause for login. Helpful: pool async opex
logger.info("βœ”οΈ hf_login already: login()", extra={"mode": "cli"})
#return True
except Exception as exc:
# Respect common env var names; prefer explicit token arg when provided
fallback_token = token if token else get_token() or os.getenv("HF_TOKEN") or os.getenv("HUGGINGFACEHUB_API_TOKEN") ##SMY: to revisit
if fallback_token:
try:
login(token=fallback_token)
#token = fallback_token ##debug
logger.info("βœ”οΈ hf_login through fallback", extra={"mode": "token"}) ##SMY: This only displays if token is provided
except Exception as exc_token:
logger.warning("❌ hf_login_failed through fallback", extra={"error": str(exc_token)})
else:
logger.warning("❌ hf_login_failed", extra={"error": str(exc)})
# Silent fallback; client will still work if token is passed directly
#pass
#def is_login_huggingface():
def is_loggedin_huggingface(token: Optional[str] = None):
#from huggingface_hub import HfApi
from huggingface_hub.utils import HfHubHTTPError
from huggingface_hub.errors import LocalTokenNotFoundError
try: ##SMY: TOOD: investigate if still needed given oauth_token: gr.OAuthToken
HfApi().whoami()
logger.log(level=20, msg=("βœ”οΈ HfApi().whoami(): You are logged in."), extra={"is_logged_in": True})
disable_immplicit_token()
return True
except LocalTokenNotFoundError as exc: #Token is required (`token=True`), but no token found
HfApi().whoami(token)
logger.log(level=20, msg=("βœ”οΈ HfApi().whoami(): You are logged in with token."), extra={"is_logged_in": True})
disable_immplicit_token()
return True
except HfHubHTTPError as exc:
# A 401 status code indicates an authentication error.
if exc.response.status_code == 401:
print("⚠️ You are not logged in. You can still access public models.")
else:
# Handle other HTTP errors if necessary
#print(f"An unexpected HTTP error occurred: {exc}")
tb = traceback.format_exc()
logger.exception(f"βœ— An unexpected HTTP error occurred: β†’ {exc}\n{tb}", exc_info=True)
#raise RuntimeError(f"βœ— An unexpected HTTP error occurred: β†’ {exc}\n{tb}") from exc
return False
finally: return False