Spaces:

mgbam
/

builder

Sleeping

App Files Files Community

mgbam committed on Jul 23

Commit

7234f57

verified ·

1 Parent(s): 71a8f19

Update hf_client.py

Browse files

Files changed (1) hide show

hf_client.py +42 -30

hf_client.py CHANGED Viewed

@@ -1,34 +1,56 @@
-### hf_client.py
-from huggingface_hub import InferenceClient, HfApi
-from tavily import TavilyClient
 import os
-# HF Inference Client
-# Supported billing targets
-_VALID_BILL_TO = {"huggingface", "fairworksai", "groq"}
 HF_TOKEN = os.getenv("HF_TOKEN")
 if not HF_TOKEN:
-    raise RuntimeError(
-        "HF_TOKEN environment variable is not set. "
-        "Please set it to your Hugging Face API token."
-    )
 def get_inference_client(model_id: str, provider: str = "auto") -> InferenceClient:
     """
-    Return an InferenceClient configured with the correct provider and billing target.
-    - If model_id == "moonshotai/Kimi-K2-Instruct", force provider to "groq".
-    - If the requested provider is not one of the supported billing targets,
-      default billing to "groq".
     """
-    # force certain models onto groq hardware
     if model_id == "moonshotai/Kimi-K2-Instruct":
         provider = "groq"
-    # determine billing target
     bill_to = provider if provider in _VALID_BILL_TO else "groq"
     return InferenceClient(
@@ -36,13 +58,3 @@ def get_inference_client(model_id: str, provider: str = "auto") -> InferenceClie
         api_key=HF_TOKEN,
         bill_to=bill_to
     )
-# Tavily Search Client
-TAVILY_API_KEY = os.getenv('TAVILY_API_KEY')
-tavily_client = None
-if TAVILY_API_KEY:
-    try:
-        tavily_client = TavilyClient(api_key=TAVILY_API_KEY)
-    except Exception as e:
-        print(f"Failed to initialize Tavily client: {e}")
-        tavily_client = None

+# hf_client.py
 import os
+from typing import Optional
+from huggingface_hub import InferenceClient
+from tavily import TavilyClient
+# Supported billing targets (your secrets)
+_VALID_BILL_TO = {
+    "huggingface",  # HF_TOKEN
+    "fairworksai",  # if you have a special billing target
+    "groq",         # GROQ_API_KEY
+    "openai",       # OPENAI_API_KEY
+    "gemini",       # GEMINI_API_KEY
+    "fireworks"     # FIREWORKS_API_KEY
+}
+# Load your HF token
 HF_TOKEN = os.getenv("HF_TOKEN")
 if not HF_TOKEN:
+    raise RuntimeError("HF_TOKEN is not set. Please configure your Hugging Face token.")
+# (Optional) Tavily client for web search
+TAVILY_API_KEY = os.getenv("TAVILY_API_KEY")
+tavily_client: Optional[TavilyClient] = None
+if TAVILY_API_KEY:
+    try:
+        tavily_client = TavilyClient(api_key=TAVILY_API_KEY)
+    except Exception as e:
+        print(f"❗ Failed to init Tavily: {e}")
 def get_inference_client(model_id: str, provider: str = "auto") -> InferenceClient:
     """
+    Selects the inference provider and billing target from the model ID:
+      • moonshotai/Kimi-K2-Instruct          → groq
+      • openai/..., gpt-4 or gpt-3.5-turbo   → openai
+      • gemini/... or google/...             → gemini
+      • fireworks/...                        → fireworks
+      • otherwise                            → huggingface (billed to huggingface)
     """
+    # pick provider from the model ID; the caller-supplied `provider` is always overwritten
     if model_id == "moonshotai/Kimi-K2-Instruct":
         provider = "groq"
+    elif model_id.startswith("openai/") or model_id in {"gpt-4", "gpt-3.5-turbo"}:
+        provider = "openai"
+    elif model_id.startswith("gemini/") or model_id.startswith("google/"):
+        provider = "gemini"
+    elif model_id.startswith("fireworks/"):
+        provider = "fireworks"
+    else:
+        provider = "huggingface"
+    # ensure billing target is valid, else fallback to groq
     bill_to = provider if provider in _VALID_BILL_TO else "groq"
     return InferenceClient(
         api_key=HF_TOKEN,
         bill_to=bill_to
     )