Dorjzodovsuren committed on
Commit
e8674ce
·
verified ·
1 Parent(s): 46f10a0

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +22 -35
app.py CHANGED
@@ -7,26 +7,13 @@ from huggingface_hub import InferenceClient
7
  """
8
  For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
9
  """
10
- #client = InferenceClient("google/gemma-3-27b-it", token=os.getenv("TOKEN"))
11
 
12
- client = InferenceClient(
13
- provider="fireworks-ai",
14
- api_key=os.getenv("TOKEN"),
15
- )
16
-
17
- # completion = client.chat.completions.create(
18
- # model="deepseek-ai/DeepSeek-V3-0324",
19
- # messages=[
20
- # {
21
- # "role": "user",
22
- # "content": "What is the capital of France?"
23
- # }
24
- # ],
25
- # max_tokens=500,
26
  # )
27
 
28
- # print(completion.choices[0].message)
29
-
30
  global history
31
  history = []
32
  async def respond(
@@ -47,26 +34,26 @@ async def respond(
47
 
48
  messages.append({"role": "user", "content": message})
49
 
50
- #response = ""
51
-
52
- #for message in client.chat_completion(
53
- # model="deepseek-ai/DeepSeek-V3-0324",
54
- # messages=messages,
55
- # max_tokens=max_tokens,
56
- # stream=True,
57
- # temperature=temperature,
58
- # top_p=top_p,
59
- # ):
60
- # token = message.choices[0].delta.content
61
- # response += token
62
 
63
- completion = client.chat.completions.create(
64
- model="deepseek-ai/DeepSeek-R1",
65
  messages=messages,
66
- max_tokens=500,
67
- )
68
- response = completion.choices[0].message.content
69
- print(response)
 
 
 
 
 
 
 
 
 
 
 
70
 
71
  communicate = edge_tts.Communicate(response, voice="mn-MN-YesuiNeural")
72
  with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp_file:
 
7
  """
8
  For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
9
  """
10
+ client = InferenceClient("google/gemma-3-27b-it", token=os.getenv("TOKEN"))
11
 
12
+ # client = InferenceClient(
13
+ # provider="fireworks-ai",
14
+ # api_key=os.getenv("TOKEN"),
 
 
 
 
 
 
 
 
 
 
 
15
  # )
16
 
 
 
17
  global history
18
  history = []
19
  async def respond(
 
34
 
35
  messages.append({"role": "user", "content": message})
36
 
37
+ response = ""
 
 
 
 
 
 
 
 
 
 
 
38
 
39
+ for message in client.chat_completion(
40
+ model="google/gemma-3-27b-it",
41
  messages=messages,
42
+ max_tokens=max_tokens,
43
+ stream=True,
44
+ temperature=temperature,
45
+ top_p=top_p,
46
+ ):
47
+ token = message.choices[0].delta.content
48
+ response += token
49
+
50
+ # completion = client.chat.completions.create(
51
+ # model="deepseek-ai/DeepSeek-R1",
52
+ # messages=messages,
53
+ # max_tokens=500,
54
+ # )
55
+ # response = completion.choices[0].message.content
56
+ # print(response)
57
 
58
  communicate = edge_tts.Communicate(response, voice="mn-MN-YesuiNeural")
59
  with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp_file: