Spaces:

mgbam
/

builder

Running

mgbam committed on Jul 23

Commit

ac4a3a2

verified ·

1 Parent(s): 2541fb7

Update hf_client.py

Files changed (1) hide show

hf_client.py CHANGED Viewed

@@ -5,18 +5,36 @@ from tavily import TavilyClient
 import os
 # HF Inference Client
-HF_TOKEN = os.getenv('HF_TOKEN')
 if not HF_TOKEN:
-    raise RuntimeError("HF_TOKEN environment variable is not set. Please set it to your Hugging Face API token.")
-def get_inference_client(model_id, provider="auto"):
-    """Return an InferenceClient with provider based on model_id and user selection."""
     if model_id == "moonshotai/Kimi-K2-Instruct":
         provider = "groq"
     return InferenceClient(
         provider=provider,
         api_key=HF_TOKEN,
-        bill_to="huggingface"
     )
 # Tavily Search Client

 import os
 # HF Inference Client
+# Names accepted as a billing target; get_inference_client bills any other provider name to "groq"
+_VALID_BILL_TO = {"huggingface", "fairworksai", "groq"}
+HF_TOKEN = os.getenv("HF_TOKEN")
 if not HF_TOKEN:  # fail at import time when the token is unset or empty
+    raise RuntimeError(
+        "HF_TOKEN environment variable is not set. "
+        "Please set it to your Hugging Face API token."
+    )
+def get_inference_client(model_id: str, provider: str = "auto") -> InferenceClient:
+    """
+    Return an InferenceClient configured with the correct provider and billing target.
+    - If model_id == "moonshotai/Kimi-K2-Instruct", force provider to "groq".
+    - If the requested provider is not one of the supported billing targets,
+      default billing to "groq".
+    """
+    # Kimi-K2-Instruct always uses the "groq" provider, overriding whatever the caller passed
     if model_id == "moonshotai/Kimi-K2-Instruct":
         provider = "groq"
+    # bill to the provider name when it is in _VALID_BILL_TO, else "groq"; NOTE(review): the default provider "auto" is therefore billed to "groq" - confirm this is intended
+    bill_to = provider if provider in _VALID_BILL_TO else "groq"
     return InferenceClient(
         provider=provider,
         api_key=HF_TOKEN,
+        bill_to=bill_to
     )
 # Tavily Search Client