Spaces:

Daemontatox
/

Mawared-Support-Assistant

Running

Daemontatox committed on Jan 12

Commit

14bd49d

verified ·

1 Parent(s): 5c2fca1

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -121,16 +121,30 @@ retriever = db.as_retriever(
 # Set up the LLM
 llm = ChatOpenAI(
-    base_url="https://api-inference.huggingface.co/v1/",
     temperature=0,
     api_key=HF_TOKEN,
-    model="mistralai/Mistral-Nemo-Instruct-2407",
     max_tokens=None,
     timeout=None
 )
 # quantization_config = BitsAndBytesConfig(
 #         load_in_4bit=True,
 #         bnb_4bit_compute_dtype=torch.bfloat16,

 # Set up the LLM
+# llm = ChatOpenAI(
+#     base_url="https://api-inference.huggingface.co/v1/",
+#     temperature=0,
+#     api_key=HF_TOKEN,
+#     model="mistralai/Mistral-Nemo-Instruct-2407",
+#     max_tokens=None,
+#     timeout=None
+# )
 llm = ChatOpenAI(
+    base_url="https://openrouter.ai/api/v1",
     temperature=0,
     api_key=HF_TOKEN,
+    model="google/gemini-2.0-flash-exp:free",
     max_tokens=None,
     timeout=None
 )
 # quantization_config = BitsAndBytesConfig(
 #         load_in_4bit=True,
 #         bnb_4bit_compute_dtype=torch.bfloat16,