Update app.py

app.py CHANGED
@@ -18,6 +18,8 @@ import inspect
 # Environment variables and configurations
 huggingface_token = os.environ.get("HUGGINGFACE_TOKEN")
 llama_cloud_api_key = os.environ.get("LLAMA_CLOUD_API_KEY")
+CLOUDFLARE_ACCOUNT_ID = os.environ.get("CLOUDFLARE_ACCOUNT_ID")
+CLOUDFLARE_AUTH_TOKEN = os.environ.get("CLOUDFLARE_AUTH_TOKEN")

 MODELS = [
     "Qwen/Qwen2-72B-Instruct",
@@ -26,7 +28,8 @@ MODELS = [
     "Qwen/Qwen2-7B-Instruct",
     "mistralai/Mistral-Nemo-Instruct-2407",
     "mistralai/Mistral-7B-Instruct-v0.3",
-    "mistralai/Mixtral-8x7B-Instruct-v0.1"
+    "mistralai/Mixtral-8x7B-Instruct-v0.1",
+    "cloudflare/llama-3.1-8b-instruct"  # Added Cloudflare Llama 3.1 model
 ]

 # Initialize LlamaParse
@@ -82,6 +85,9 @@ def update_vectors(files, parser):
     return f"Vector store updated successfully. Processed {total_chunks} chunks from {len(files)} files using {parser}."

 def generate_chunked_response(prompt, model, max_tokens=1000, max_chunks=5, temperature=0.7):
+    if model == "cloudflare/llama-3.1-8b-instruct":
+        return generate_cloudflare_response(prompt, max_tokens, temperature)
+
     client = InferenceClient(
         model,
         token=huggingface_token,
@@ -111,6 +117,31 @@ def generate_chunked_response(prompt, model, max_tokens=1000, max_chunks=5, temp

     return clean_response

+def generate_cloudflare_response(prompt, max_tokens, temperature):
+    try:
+        response = requests.post(
+            f"https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/run/@cf/meta/llama-3.1-8b-instruct",
+            headers={"Authorization": f"Bearer {CLOUDFLARE_AUTH_TOKEN}"},
+            json={
+                "messages": [
+                    {"role": "system", "content": "You are a friendly assistant"},
+                    {"role": "user", "content": prompt}
+                ],
+                "max_tokens": max_tokens,
+                "temperature": temperature
+            }
+        )
+        result = response.json()
+        if 'result' in result and 'response' in result['result']:
+            return result['result']['response']
+        else:
+            print(f"Unexpected response format: {result}")
+            return "Error: Unexpected response format from Cloudflare API"
+    except Exception as e:
+        print(f"Error in generating Cloudflare response: {str(e)}")
+        return f"Error: {str(e)}"
+
+
 def duckduckgo_search(query):
     with DDGS() as ddgs:
         results = ddgs.text(query, max_results=5)
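
A note on the configuration change: the commit reads CLOUDFLARE_ACCOUNT_ID and CLOUDFLARE_AUTH_TOKEN with os.environ.get, which returns None when a secret is not set on the Space, so a missing credential only surfaces later as a malformed request URL. A small startup guard would fail fast instead; this is a suggested sketch, not part of the commit:

import os

# Suggested guard (not in the commit): refuse to start if the new
# Cloudflare secrets are absent, rather than formatting None into
# the request URL on the first chat turn.
for var in ("CLOUDFLARE_ACCOUNT_ID", "CLOUDFLARE_AUTH_TOKEN"):
    if not os.environ.get(var):
        raise RuntimeError(f"Missing required environment variable: {var}")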
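
Because the Cloudflare model is dispatched on its sentinel id at the top of generate_chunked_response, existing callers need no changes: selecting "cloudflare/llama-3.1-8b-instruct" short-circuits to the REST call before an InferenceClient is ever constructed. A quick smoke test, assuming the two Cloudflare secrets are set (the prompt text is illustrative):

# Dispatches to generate_cloudflare_response via the model-id check
# added in this commit; the Hugging Face InferenceClient is never built.
reply = generate_chunked_response(
    "Explain retrieval-augmented generation in two sentences.",
    "cloudflare/llama-3.1-8b-instruct",
    max_tokens=256,
    temperature=0.7,
)
print(reply)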