Update app.py
app.py
CHANGED
@@ -108,16 +108,28 @@ retriever = db.as_retriever(
 
 
 # Set up the LLM
-llm = ChatOpenAI(
-    base_url="https://api-inference.huggingface.co/v1/",
-    temperature=0,
-    api_key=HF_TOKEN,
-    model="meta-llama/Llama-3.3-70B-Instruct",
-    max_tokens=None,
-    timeout=None
+# llm = ChatOpenAI(
+#     base_url="https://api-inference.huggingface.co/v1/",
+#     temperature=0,
+#     api_key=HF_TOKEN,
+#     model="meta-llama/Llama-3.3-70B-Instruct",
+#     max_tokens=None,
+#     timeout=None
 
+# )
+repo_id = "CohereForAI/c4ai-command-r7b-12-2024"
+
+llm = HuggingFaceEndpoint(
+    repo_id=repo_id,
+    max_length=8192,
+    temperature=0,
+    huggingfacehub_api_token=HF_TOKEN,
 )
 
+
+
+
+
 # Create prompt template with chat history
 template = """
 You are an expert assistant specializing in the Mawared HR System.
@@ -138,6 +150,9 @@ Answer:
 prompt = ChatPromptTemplate.from_template(template)
 
 # Create the RAG chain with chat history
+
+
+@spaces.GPU(600)
 def create_rag_chain(chat_history: str):
     chain = (
         {