Ali2206 committed on
Commit
20d61bd
·
verified ·
1 Parent(s): b92dc05

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +48 -17
app.py CHANGED
@@ -1,4 +1,9 @@
1
-
 
 
 
 
 
2
  from typing import List
3
  from concurrent.futures import ThreadPoolExecutor, as_completed
4
  import hashlib
@@ -51,7 +56,7 @@ def extract_priority_pages(file_path: str, max_pages: int = 20) -> str:
51
  text_chunks.append(f"=== Page {i+1} ===\n{text.strip()}")
52
  for i, page in enumerate(pdf.pages[3:max_pages], start=4):
53
  page_text = page.extract_text() or ""
54
- if any(re.search(rf'\\b{kw}\\b', page_text.lower()) for kw in MEDICAL_KEYWORDS):
55
  text_chunks.append(f"=== Page {i} ===\n{page_text.strip()}")
56
  return "\n\n".join(text_chunks)
57
  except Exception as e:
@@ -126,6 +131,30 @@ def init_agent():
126
  print("✅ Agent Ready")
127
  return agent
128
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
129
  def create_ui(agent):
130
  with gr.Blocks(theme=gr.themes.Soft()) as demo:
131
  gr.Markdown("<h1 style='text-align: center;'>🩺 Clinical Oversight Assistant</h1>")
@@ -163,8 +192,6 @@ Medical Records:
163
 
164
  try:
165
  response = ""
166
- finish_detected = False
167
-
168
  for chunk in agent.run_gradio_chat(
169
  message=prompt,
170
  history=[],
@@ -179,18 +206,22 @@ Medical Records:
179
  if isinstance(chunk, str):
180
  response += chunk
181
  elif isinstance(chunk, list):
182
- chunk_str = "".join([c.content for c in chunk if hasattr(c, "content") and c.content])
183
- response += chunk_str
184
- if '"name": "Finish"' in chunk_str:
185
- finish_detected = True
186
-
187
- clean_response = response.rsplit("[TOOL_CALLS]", 1)[0].strip()
188
- print("🔎 Final Cleaned Response:", repr(clean_response))
189
- if not clean_response:
190
- clean_response = "⚠️ No clear oversights identified or model output was invalid."
191
-
192
- history[-1] = {"role": "assistant", "content": clean_response}
193
- report_path = os.path.join(report_dir, f"{file_hash_value}_report.txt") if file_hash_value else None
 
 
 
 
194
  yield history, report_path if report_path and os.path.exists(report_path) else None
195
 
196
  except Exception as e:
@@ -212,4 +243,4 @@ if __name__ == "__main__":
212
  show_error=True,
213
  allowed_paths=[report_dir],
214
  share=False
215
- )
 
1
+ import sys
2
+ import os
3
+ import pandas as pd
4
+ import pdfplumber
5
+ import json
6
+ import gradio as gr
7
  from typing import List
8
  from concurrent.futures import ThreadPoolExecutor, as_completed
9
  import hashlib
 
56
  text_chunks.append(f"=== Page {i+1} ===\n{text.strip()}")
57
  for i, page in enumerate(pdf.pages[3:max_pages], start=4):
58
  page_text = page.extract_text() or ""
59
+ if any(re.search(rf'\b{kw}\b', page_text.lower()) for kw in MEDICAL_KEYWORDS):
60
  text_chunks.append(f"=== Page {i} ===\n{page_text.strip()}")
61
  return "\n\n".join(text_chunks)
62
  except Exception as e:
 
131
  print("✅ Agent Ready")
132
  return agent
133
 
134
+ def clean_response(response: str) -> str:
135
+ """Clean the response by removing tool calls and duplicate content."""
136
+ # Remove all tool call blocks
137
+ response = re.sub(r'\[TOOL_CALLS\].*?$', '', response, flags=re.DOTALL)
138
+
139
+ # Remove duplicate sentences (simple approach)
140
+ sentences = [s.strip() for s in response.split('.') if s.strip()]
141
+ unique_sentences = []
142
+ seen_sentences = set()
143
+
144
+ for sentence in sentences:
145
+ if sentence not in seen_sentences:
146
+ seen_sentences.add(sentence)
147
+ unique_sentences.append(sentence)
148
+
149
+ # Reconstruct the response
150
+ cleaned = '. '.join(unique_sentences) + '.' if unique_sentences else response
151
+
152
+ # Remove any remaining JSON-like artifacts
153
+ cleaned = re.sub(r'\{.*?\}', '', cleaned)
154
+ cleaned = re.sub(r'\[.*?\]', '', cleaned)
155
+
156
+ return cleaned.strip()
157
+
158
  def create_ui(agent):
159
  with gr.Blocks(theme=gr.themes.Soft()) as demo:
160
  gr.Markdown("<h1 style='text-align: center;'>🩺 Clinical Oversight Assistant</h1>")
 
192
 
193
  try:
194
  response = ""
 
 
195
  for chunk in agent.run_gradio_chat(
196
  message=prompt,
197
  history=[],
 
206
  if isinstance(chunk, str):
207
  response += chunk
208
  elif isinstance(chunk, list):
209
+ response += "".join([c.content for c in chunk if hasattr(c, "content") and c.content])
210
+
211
+ # Clean the response before displaying
212
+ clean_response_text = clean_response(response)
213
+
214
+ if not clean_response_text:
215
+ clean_response_text = "⚠️ No clear oversights identified or model output was invalid."
216
+
217
+ # Save the full report
218
+ report_path = None
219
+ if file_hash_value:
220
+ report_path = os.path.join(report_dir, f"{file_hash_value}_report.txt")
221
+ with open(report_path, "w", encoding="utf-8") as f:
222
+ f.write(clean_response_text)
223
+
224
+ history[-1] = {"role": "assistant", "content": clean_response_text}
225
  yield history, report_path if report_path and os.path.exists(report_path) else None
226
 
227
  except Exception as e:
 
243
  show_error=True,
244
  allowed_paths=[report_dir],
245
  share=False
246
+ )