CPS-Test-Mobile

Paused

App Files Files Community

Ali2206 committed on Apr 12

Commit

e24be23

verified ·

1 Parent(s): 9c0d5a4

Update app.py

Browse files

Files changed (1) hide show

app.py +124 -52

app.py CHANGED Viewed

@@ -4,53 +4,51 @@ import pandas as pd
 import pdfplumber
 import json
 import gradio as gr
-from typing import List
 from concurrent.futures import ThreadPoolExecutor, as_completed
 import hashlib
 import shutil
-# ✅ Fix: Add src to Python path
-sys.path.insert(0, os.path.abspath(os.path.join(os.path.dirname(__file__), "..", "src")))
-# ✅ Persist model cache to Hugging Face Space's /data directory
-model_cache_dir = "/data/txagent_models"
 os.makedirs(model_cache_dir, exist_ok=True)
 os.environ["TRANSFORMERS_CACHE"] = model_cache_dir
 os.environ["HF_HOME"] = model_cache_dir
 from txagent.txagent import TxAgent
 def sanitize_utf8(text: str) -> str:
     return text.encode("utf-8", "ignore").decode("utf-8")
-def clean_final_response(text: str) -> str:
-    cleaned = text.replace("[TOOL_CALLS]", "").strip()
-    responses = cleaned.split("[Final Analysis]")
-    if len(responses) <= 1:
-        return f"<div style='padding:1em;border:1px solid #ccc;border-radius:12px;color:#fff;background:#353F54;'><p>{cleaned}</p></div>"
-    panels = []
-    for i, section in enumerate(responses[1:], 1):
-        final = section.strip()
-        panels.append(
-            f"<div style='background:#2B2B2B;color:#E0E0E0;border-radius:12px;margin-bottom:1em;border:1px solid #888;'>"
-            f"<div style='font-size:1.1em;font-weight:bold;padding:0.75em;background:#3A3A3A;color:#fff;border-radius:12px 12px 0 0;'>🧠 Final Analysis #{i}</div>"
-            f"<div style='padding:1em;line-height:1.6;'>{final.replace(chr(10), '<br>')}</div>"
-            f"</div>"
-        )
-    return "".join(panels)
-def file_hash(path):
     with open(path, "rb") as f:
         return hashlib.md5(f.read()).hexdigest()
 def convert_file_to_json(file_path: str, file_type: str) -> str:
     try:
-        cache_dir = "/data/cache"
-        os.makedirs(cache_dir, exist_ok=True)
         h = file_hash(file_path)
-        cache_path = os.path.join(cache_dir, f"{h}.json")
         if os.path.exists(cache_path):
             return open(cache_path, "r", encoding="utf-8").read()
@@ -66,7 +64,8 @@ def convert_file_to_json(file_path: str, file_type: str) -> str:
             with pdfplumber.open(file_path) as pdf:
                 text = "\n".join([page.extract_text() or "" for page in pdf.pages])
             result = json.dumps({"filename": os.path.basename(file_path), "content": text.strip()})
-            open(cache_path, "w", encoding="utf-8").write(result)
             return result
         else:
             return json.dumps({"error": f"Unsupported file type: {file_type}"})
@@ -77,11 +76,49 @@ def convert_file_to_json(file_path: str, file_type: str) -> str:
         df = df.fillna("")
         content = df.astype(str).values.tolist()
         result = json.dumps({"filename": os.path.basename(file_path), "rows": content})
-        open(cache_path, "w", encoding="utf-8").write(result)
         return result
     except Exception as e:
         return json.dumps({"error": f"Error reading {os.path.basename(file_path)}: {str(e)}"})
 def create_ui(agent: TxAgent):
     with gr.Blocks(theme=gr.themes.Soft()) as demo:
         gr.Markdown("<h1 style='text-align: center;'>📋 CPS: Clinical Patient Support System</h1>")
@@ -97,60 +134,66 @@ def create_ui(agent: TxAgent):
         conversation_state = gr.State([])
         def handle_chat(message: str, history: list, conversation: list, uploaded_files: list, progress=gr.Progress()):
             try:
                 history.append({"role": "user", "content": message})
                 history.append({"role": "assistant", "content": "⏳ Processing your request..."})
                 yield history
                 extracted_text = ""
                 if uploaded_files and isinstance(uploaded_files, list):
-                    for file in uploaded_files:
-                        if not hasattr(file, 'name'):
-                            continue
-                        path = file.name
-                        ext = path.split(".")[-1].lower()
-                        json_text = convert_file_to_json(path, ext)
-                        extracted_text += sanitize_utf8(json_text) + "\n"
                 context = (
-                    "You are an expert clinical AI assistant. Review this patient's history, medications, and notes, and ONLY provide a final answer summarizing what the doctor might have missed."
                 )
                 chunked_prompt = f"{context}\n\n--- Patient Record ---\n{extracted_text}\n\n[Final Analysis]"
                 generator = agent.run_gradio_chat(
                     message=chunked_prompt,
                     history=[],
                     temperature=0.3,
-                    max_new_tokens=1024,
-                    max_token=8192,
                     call_agent=False,
                     conversation=conversation,
                     uploaded_files=uploaded_files,
-                    max_round=30
                 )
-                final_response = ""
                 for update in generator:
                     if not update:
                         continue
-                    if isinstance(update, list):
                         for msg in update:
-                            if hasattr(msg, "content"):
-                                final_response += msg.content
-                    elif isinstance(update, str):
-                        final_response += update
-                    history[-1] = {"role": "assistant", "content": final_response.strip()}
-                    yield history
-                cleaned = final_response.strip().replace("[TOOL_CALLS]", "").strip()
-                history[-1] = {"role": "assistant", "content": cleaned or "❌ No response."}
                 yield history
             except Exception as chat_error:
                 print(f"Chat handling error: {chat_error}")
                 history[-1] = {"role": "assistant", "content": "❌ An error occurred while processing your request."}
                 yield history
         inputs = [message_input, chatbot, conversation_state, file_upload]
         send_button.click(fn=handle_chat, inputs=inputs, outputs=chatbot)
@@ -163,3 +206,32 @@ def create_ui(agent: TxAgent):
         ], inputs=message_input)
     return demo

 import pdfplumber
 import json
 import gradio as gr
+from typing import List, Optional
 from concurrent.futures import ThreadPoolExecutor, as_completed
 import hashlib
 import shutil
+import time
+from functools import lru_cache
+# Environment and path setup
+current_dir = os.path.dirname(os.path.abspath(__file__))
+src_path = os.path.abspath(os.path.join(current_dir, "src"))
+print(f"Adding to path: {src_path}")
+sys.path.insert(0, src_path)
+# Configure cache directories
+base_dir = "/data"
+model_cache_dir = os.path.join(base_dir, "txagent_models")
+tool_cache_dir = os.path.join(base_dir, "tool_cache")
+file_cache_dir = os.path.join(base_dir, "cache")
 os.makedirs(model_cache_dir, exist_ok=True)
+os.makedirs(tool_cache_dir, exist_ok=True)
+os.makedirs(file_cache_dir, exist_ok=True)
 os.environ["TRANSFORMERS_CACHE"] = model_cache_dir
 os.environ["HF_HOME"] = model_cache_dir
+os.environ["TOKENIZERS_PARALLELISM"] = "false"
+os.environ["CUDA_LAUNCH_BLOCKING"] = "1"
 from txagent.txagent import TxAgent
 def sanitize_utf8(text: str) -> str:
     return text.encode("utf-8", "ignore").decode("utf-8")
def file_hash(path: str) -> str:
    """Return the hexadecimal MD5 digest of the file at *path*.

    The digest is used only as a cache key for converted files, not for any
    security purpose. The file is hashed in fixed-size chunks so that a large
    upload is never held in memory in full.

    Args:
        path: Filesystem path of the file to hash.

    Returns:
        The 32-character lowercase hex digest of the file's bytes.

    Raises:
        OSError: If the file cannot be opened or read.
    """
    digest = hashlib.md5()
    with open(path, "rb") as f:
        # iter() with a sentinel stops at the first empty read (EOF).
        for chunk in iter(lambda: f.read(1024 * 1024), b""):
            digest.update(chunk)
    return digest.hexdigest()
@lru_cache(maxsize=100)
def get_cached_response(prompt: str, file_hash: str) -> Optional[str]:
    """Placeholder lookup for a previously generated response.

    The body currently has no lookup logic and always yields ``None``; the
    ``lru_cache`` wrapper memoises that result for up to 100 distinct
    ``(prompt, file_hash)`` pairs.

    Args:
        prompt: Prompt text forming the first part of the cache key.
        file_hash: Hash string forming the second part of the cache key.

    Returns:
        Always ``None``.
    """
    no_cached_answer: Optional[str] = None
    return no_cached_answer
 def convert_file_to_json(file_path: str, file_type: str) -> str:
     try:
         h = file_hash(file_path)
+        cache_path = os.path.join(file_cache_dir, f"{h}.json")
         if os.path.exists(cache_path):
             return open(cache_path, "r", encoding="utf-8").read()
             with pdfplumber.open(file_path) as pdf:
                 text = "\n".join([page.extract_text() or "" for page in pdf.pages])
             result = json.dumps({"filename": os.path.basename(file_path), "content": text.strip()})
+            with open(cache_path, "w", encoding="utf-8") as f:
+                f.write(result)
             return result
         else:
             return json.dumps({"error": f"Unsupported file type: {file_type}"})
         df = df.fillna("")
         content = df.astype(str).values.tolist()
         result = json.dumps({"filename": os.path.basename(file_path), "rows": content})
+        with open(cache_path, "w", encoding="utf-8") as f:
+            f.write(result)
         return result
     except Exception as e:
         return json.dumps({"error": f"Error reading {os.path.basename(file_path)}: {str(e)}"})
def convert_files_to_json_parallel(uploaded_files: list) -> str:
    """Convert uploaded files to JSON text concurrently and join the results.

    Each entry that exposes a ``name`` attribute is passed to
    ``convert_file_to_json`` on a pool of up to four worker threads, with
    ``name`` used as the file path. Results are collected in upload order, so
    the combined text is the same on every run regardless of which conversion
    finishes first.

    Args:
        uploaded_files: Upload objects; entries without a ``name`` attribute
            are skipped. ``None`` or an empty list is accepted.

    Returns:
        The sanitized JSON strings, one per converted file, joined with
        newlines. An empty string when there is nothing to convert.
    """
    if not uploaded_files:
        return ""

    paths = [item.name for item in uploaded_files if hasattr(item, "name")]
    if not paths:
        return ""

    with ThreadPoolExecutor(max_workers=4) as executor:
        futures = [
            # splitext only looks at the final path component, so dots in
            # directory names and extension-less files yield "" rather than
            # a bogus file type.
            executor.submit(
                convert_file_to_json,
                path,
                os.path.splitext(path)[1].lstrip(".").lower(),
            )
            for path in paths
        ]
        # Iterate the futures in submission order (not completion order) to
        # keep the output aligned with the order of the uploads.
        return "\n".join(sanitize_utf8(future.result()) for future in futures)
def init_agent():
    """Create the TxAgent instance used by the application.

    Copies ``data/new_tool.json`` (resolved against the current working
    directory) into the tool cache directory if no copy exists there yet,
    constructs a ``TxAgent`` pointing at the cached copy, calls its
    ``init_model()`` method, and returns the agent.

    Returns:
        The ``TxAgent`` instance after ``init_model()`` has been called.
    """
    bundled_tool_file = os.path.abspath("data/new_tool.json")
    cached_tool_file = os.path.join(tool_cache_dir, "new_tool.json")

    # Populate the cache only when no copy is present; an existing file is kept.
    tool_already_cached = os.path.exists(cached_tool_file)
    if not tool_already_cached:
        shutil.copy(bundled_tool_file, cached_tool_file)

    agent_settings = {
        "model_name": "mims-harvard/TxAgent-T1-Llama-3.1-8B",
        "rag_model_name": "mims-harvard/ToolRAG-T1-GTE-Qwen2-1.5B",
        "tool_files_dict": {"new_tool": cached_tool_file},
        "force_finish": True,
        "enable_checker": True,
        "step_rag_num": 8,
        "seed": 100,
        "additional_default_tools": [],
    }
    tx_agent = TxAgent(**agent_settings)
    tx_agent.init_model()
    return tx_agent
 def create_ui(agent: TxAgent):
     with gr.Blocks(theme=gr.themes.Soft()) as demo:
         gr.Markdown("<h1 style='text-align: center;'>📋 CPS: Clinical Patient Support System</h1>")
         conversation_state = gr.State([])
         def handle_chat(message: str, history: list, conversation: list, uploaded_files: list, progress=gr.Progress()):
+            start_time = time.time()
             try:
                 history.append({"role": "user", "content": message})
                 history.append({"role": "assistant", "content": "⏳ Processing your request..."})
                 yield history
+                file_process_time = time.time()
                 extracted_text = ""
                 if uploaded_files and isinstance(uploaded_files, list):
+                    extracted_text = convert_files_to_json_parallel(uploaded_files)
+                print(f"File processing took: {time.time() - file_process_time:.2f}s")
                 context = (
+                    "You are an expert clinical AI assistant. Review this patient's history, "
+                    "medications, and notes, and ONLY provide a final answer summarizing "
+                    "what the doctor might have missed."
                 )
                 chunked_prompt = f"{context}\n\n--- Patient Record ---\n{extracted_text}\n\n[Final Analysis]"
+                model_start = time.time()
                 generator = agent.run_gradio_chat(
                     message=chunked_prompt,
                     history=[],
                     temperature=0.3,
+                    max_new_tokens=768,
+                    max_token=4096,
                     call_agent=False,
                     conversation=conversation,
                     uploaded_files=uploaded_files,
+                    max_round=10
                 )
+                final_response = []
                 for update in generator:
                     if not update:
                         continue
+                    if isinstance(update, str):
+                        final_response.append(update)
+                    elif isinstance(update, list):
                         for msg in update:
+                            if hasattr(msg, 'content'):
+                                final_response.append(msg.content)
+                    if len(final_response) % 3 == 0:
+                        content = "".join(final_response).strip().replace("[TOOL_CALLS]", "")
+                        history[-1] = {"role": "assistant", "content": content or "❌ No response."}
+                        yield history
+                final_cleaned = "".join(final_response).strip().replace("[TOOL_CALLS]", "")
+                history[-1] = {"role": "assistant", "content": final_cleaned or "❌ No response."}
+                print("Final model response:\n", final_cleaned)
+                print(f"Model processing took: {time.time() - model_start:.2f}s")
                 yield history
             except Exception as chat_error:
                 print(f"Chat handling error: {chat_error}")
                 history[-1] = {"role": "assistant", "content": "❌ An error occurred while processing your request."}
                 yield history
+            finally:
+                print(f"Total request time: {time.time() - start_time:.2f}s")
         inputs = [message_input, chatbot, conversation_state, file_upload]
         send_button.click(fn=handle_chat, inputs=inputs, outputs=chatbot)
         ], inputs=message_input)
     return demo
if __name__ == "__main__":
    # Script entry point: build the agent, run one small warm-up generation,
    # then launch the Gradio interface.
    print("Initializing agent...")
    agent = init_agent()

    print("Performing warm-up call...")
    try:
        warm_up = agent.run_gradio_chat(
            message="Warm up",
            history=[],
            temperature=0.1,
            max_new_tokens=10,
            max_token=100,
            call_agent=False,
            conversation=[]
        )
        # run_gradio_chat is consumed as an iterator; drain it so the call
        # actually runs to completion.
        for _ in warm_up:
            pass
    except Exception as warm_up_error:
        # The warm-up is best-effort, so a failure must not prevent the UI
        # from starting. It is still reported, and Ctrl-C / SystemExit are
        # no longer swallowed the way a bare ``except:`` would swallow them.
        print(f"Warm-up call failed (continuing): {warm_up_error}")

    print("Launching interface...")
    demo = create_ui(agent)
    demo.queue().launch(
        server_name="0.0.0.0",
        server_port=7860,
        show_error=True,
        share=True
    )