Sentinel-AI-Beta-Test

Sleeping

App Files Files Community

Shreyas094 committed on Aug 30, 2024

Commit

42fe9e9

verified ·

1 Parent(s): a3c94f0

Update app.py

Browse files

Files changed (1) hide show

app.py +34 -6

app.py CHANGED Viewed

@@ -353,12 +353,12 @@ def summarize_web_results(query: str, search_results: List[Dict[str, str]], conv
     except Exception as e:
         return f"An error occurred during summarization: {str(e)}"
-def get_response_from_gemini(query, context, file_type, num_calls=1, temperature=0.2):
     # Configure the Gemini API
     genai.configure(api_key=os.environ["GEMINI_API_KEY"])
     # Define the model
-    model = genai.GenerativeModel(
         model_name="gemini-1.5-flash",
         generation_config={
             "temperature": temperature,
@@ -368,27 +368,55 @@ def get_response_from_gemini(query, context, file_type, num_calls=1, temperature
         },
     )
-    # Create the system instruction based on file type
     if file_type == "excel":
         system_instruction = """You are a highly specialized data analyst with expertise in Excel spreadsheets.
         Your task is to analyze the provided Excel data and answer the user's query accurately and concisely.
         Focus on identifying key metrics, trends, and significant details relevant to the query.
         Do not make assumptions or include information not explicitly supported by the dataset."""
     elif file_type == "pdf":
         system_instruction = """You are a highly specialized document analyst with expertise in extracting information from PDF documents.
         Your task is to analyze the provided PDF content and answer the user's query accurately and comprehensively.
         Focus on key points, important details, and relevant information from the document.
         Ensure your response is strictly based on the provided context."""
     else:
         raise ValueError("Invalid file type. Use 'excel' or 'pdf'.")
-    full_prompt = f"{system_instruction}\n\nContext:\n{context}\n\nUser query: {query}"
     full_response = ""
     for _ in range(num_calls):
         try:
             # Generate content with streaming enabled
-            response = model.generate_content(full_prompt, stream=True)
             for chunk in response:
                 if chunk.text:
                     full_response += chunk.text

     except Exception as e:
         return f"An error occurred during summarization: {str(e)}"
+def get_response_from_gemini(query, model, selected_docs, file_type, num_calls=1, temperature=0.2):
     # Configure the Gemini API
     genai.configure(api_key=os.environ["GEMINI_API_KEY"])
     # Define the model
+    gemini_model = genai.GenerativeModel(
         model_name="gemini-1.5-flash",
         generation_config={
             "temperature": temperature,
         },
     )
     if file_type == "excel":
+        # Excel functionality remains the same
         system_instruction = """You are a highly specialized data analyst with expertise in Excel spreadsheets.
         Your task is to analyze the provided Excel data and answer the user's query accurately and concisely.
         Focus on identifying key metrics, trends, and significant details relevant to the query.
         Do not make assumptions or include information not explicitly supported by the dataset."""
+        full_prompt = f"{system_instruction}\n\nContext:\n{selected_docs}\n\nUser query: {query}"
     elif file_type == "pdf":
+        # PDF functionality similar to get_response_from_pdf
+        embed = get_embeddings()
+        if os.path.exists("faiss_database"):
+            database = FAISS.load_local("faiss_database", embed, allow_dangerous_deserialization=True)
+        else:
+            yield "No documents available. Please upload PDF documents to answer questions."
+            return
+        # Pre-filter the documents
+        filtered_docs = [doc for doc_id, doc in database.docstore._dict.items()
+                         if isinstance(doc, Document) and doc.metadata.get("source") in selected_docs]
+        if not filtered_docs:
+            yield "No relevant information found in the selected documents. Please try selecting different documents or rephrasing your query."
+            return
+        # Create a new FAISS index with only the selected documents
+        filtered_db = FAISS.from_documents(filtered_docs, embed)
+        retriever = filtered_db.as_retriever(search_kwargs={"k": 10})
+        relevant_docs = retriever.get_relevant_documents(query)
+        context_str = "\n".join([doc.page_content for doc in relevant_docs])
         system_instruction = """You are a highly specialized document analyst with expertise in extracting information from PDF documents.
         Your task is to analyze the provided PDF content and answer the user's query accurately and comprehensively.
         Focus on key points, important details, and relevant information from the document.
         Ensure your response is strictly based on the provided context."""
+        full_prompt = f"{system_instruction}\n\nContext:\n{context_str}\n\nUser query: {query}\n\nPlease generate a step-by-step reasoning before arriving at a comprehensive and accurate summary addressing the question. Ensure your response is strictly based on the provided context, highlighting key metrics, trends, and significant details relevant to the query. Avoid any speculative or unverified information."
     else:
         raise ValueError("Invalid file type. Use 'excel' or 'pdf'.")
     full_response = ""
     for _ in range(num_calls):
         try:
             # Generate content with streaming enabled
+            response = gemini_model.generate_content(full_prompt, stream=True)
             for chunk in response:
                 if chunk.text:
                     full_response += chunk.text