Update app.py
Browse files
app.py
CHANGED
@@ -105,20 +105,17 @@ retriever = db.as_retriever(
|
|
105 |
|
106 |
# Load model directly
|
107 |
|
108 |
-
model_id="CohereForAI/c4ai-command-r7b-12-2024"
|
109 |
-
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
110 |
-
model = AutoModelForCausalLM.from_pretrained(model_id)
|
111 |
-
pipe = pipeline("text-generation", model=model, tokenizer=tokenizer)
|
112 |
-
llm = HuggingFacePipeline(pipeline=pipe)
|
113 |
|
114 |
|
115 |
# Set up the LLM
|
116 |
-
|
117 |
-
|
118 |
-
|
119 |
-
|
120 |
-
|
121 |
-
|
|
|
|
|
122 |
|
123 |
# Create prompt template with chat history
|
124 |
template = """
|
@@ -158,7 +155,7 @@ def create_rag_chain(chat_history: str):
|
|
158 |
chat_history = ChatHistory()
|
159 |
|
160 |
# Gradio Function
|
161 |
-
|
162 |
def ask_question_gradio(question, history):
|
163 |
try:
|
164 |
# Add user question to chat history
|
|
|
105 |
|
106 |
# Load model directly
|
107 |
|
|
|
|
|
|
|
|
|
|
|
108 |
|
109 |
|
110 |
# Set up the LLM
|
111 |
+
# Set up the LLM: served via the Hugging Face Inference API, which exposes an
# OpenAI-compatible endpoint, so langchain's ChatOpenAI client can talk to it.
llm = ChatOpenAI(
    base_url="https://api-inference.huggingface.co/v1/",
    temperature=0,  # deterministic output — appropriate for RAG answering
    api_key=HF_TOKEN,
    model="Qwen/Qwen2.5-Coder-32B-Instruct",
    # FIX: the constructor flag is `streaming`, not `stream`. `stream=True`
    # is not a recognized ChatOpenAI field and would be shunted into
    # model_kwargs (or rejected) without actually enabling token streaming.
    streaming=True,
)
|
119 |
|
120 |
# Create prompt template with chat history
|
121 |
template = """
|
|
|
155 |
chat_history = ChatHistory()
|
156 |
|
157 |
# Gradio Function
|
158 |
+
|
159 |
def ask_question_gradio(question, history):
|
160 |
try:
|
161 |
# Add user question to chat history
|