Spaces:

mgbam
/

builder

Sleeping

App Files Files Community

mgbam committed on Jul 23

Commit

e2e2a15

verified ·

1 Parent(s): 7234f57

Update hf_client.py

Browse files

Files changed (1) hide show

hf_client.py +24 -24

hf_client.py CHANGED Viewed

@@ -5,40 +5,39 @@ from typing import Optional
 from huggingface_hub import InferenceClient
 from tavily import TavilyClient
-# Supported billing targets (your secrets)
-_VALID_BILL_TO = {
-    "huggingface",  # HF_TOKEN
-    "fairworksai",  # if you have a special billing target
-    "groq",         # GROQ_API_KEY
-    "openai",       # OPENAI_API_KEY
-    "gemini",       # GEMINI_API_KEY
-    "fireworks"     # FIREWORKS_API_KEY
-}
-# Load your HF token
 HF_TOKEN = os.getenv("HF_TOKEN")
 if not HF_TOKEN:
-    raise RuntimeError("HF_TOKEN is not set. Please configure your Hugging Face token.")
-# (Optional) Tavily client for web search
-TAVILY_API_KEY = os.getenv("TAVILY_API_KEY")
 tavily_client: Optional[TavilyClient] = None
 if TAVILY_API_KEY:
     try:
         tavily_client = TavilyClient(api_key=TAVILY_API_KEY)
     except Exception as e:
-        print(f"❗ Failed to init Tavily: {e}")
 def get_inference_client(model_id: str, provider: str = "auto") -> InferenceClient:
     """
-    Selects the appropriate inference provider & billing target:
-      • moonshotai/Kimi-K2-Instruct  → groq
-      • openai/... or GPT family     → openai
-      • gemini/... or google/...     → gemini
-      • fireworks/...                → fireworks
-      • otherwise                    → huggingface (billing to groq)
     """
-    # override by model prefix
     if model_id == "moonshotai/Kimi-K2-Instruct":
         provider = "groq"
     elif model_id.startswith("openai/") or model_id in {"gpt-4", "gpt-3.5-turbo"}:
@@ -48,9 +47,10 @@ def get_inference_client(model_id: str, provider: str = "auto") -> InferenceClie
     elif model_id.startswith("fireworks/"):
         provider = "fireworks"
     else:
-        provider = "huggingface"
-    # ensure billing target is valid, else fallback to groq
     bill_to = provider if provider in _VALID_BILL_TO else "groq"
     return InferenceClient(

 from huggingface_hub import InferenceClient
 from tavily import TavilyClient
+# Supported billing targets
+_VALID_BILL_TO = {"huggingface", "fairworksai", "groq", "openai", "gemini", "fireworks", "googler"}
+# Load Hugging Face token
 HF_TOKEN = os.getenv("HF_TOKEN")
 if not HF_TOKEN:
+    raise RuntimeError(
+        "HF_TOKEN environment variable is not set. "
+        "Please set it to your Hugging Face API token."
+    )
+# Initialize Tavily search client (optional)
+TAVILY_API_KEY = os.getenv('TAVILY_API_KEY')
 tavily_client: Optional[TavilyClient] = None
 if TAVILY_API_KEY:
     try:
         tavily_client = TavilyClient(api_key=TAVILY_API_KEY)
     except Exception as e:
+        print(f"Failed to initialize Tavily client: {e}")
+        tavily_client = None
 def get_inference_client(model_id: str, provider: str = "auto") -> InferenceClient:
     """
+    Configure InferenceClient based on model_id prefixes:
+      - moonshotai/Kimi-K2-Instruct → provider "groq"
+      - openai/... or GPT names       → provider "openai"
+      - gemini/... or google/...     → provider "gemini"
+      - fireworks/...                → provider "fireworks"
+      - otherwise                     → use HF Inference provider (auto)
+    Bill to the chosen provider if valid; otherwise, default to "groq".
     """
+    # Override provider by model
     if model_id == "moonshotai/Kimi-K2-Instruct":
         provider = "groq"
     elif model_id.startswith("openai/") or model_id in {"gpt-4", "gpt-3.5-turbo"}:
     elif model_id.startswith("fireworks/"):
         provider = "fireworks"
     else:
+        # For Hugging Face models, let HF Inference pick best provider
+        provider = "auto"
+    # Determine billing target
     bill_to = provider if provider in _VALID_BILL_TO else "groq"
     return InferenceClient(