CPS-Test-Mobile

Paused

App Files Community

Ali2206 committed on Apr 12

Commit

9c0d5a4

verified ·

1 Parent(s): 9b25f67

Update app.py

Browse files

Files changed (1) hide show

app.py +53 -120

app.py CHANGED Viewed

@@ -4,51 +4,53 @@ import pandas as pd
 import pdfplumber
 import json
 import gradio as gr
-from typing import List, Optional
 from concurrent.futures import ThreadPoolExecutor, as_completed
 import hashlib
 import shutil
-import time
-from functools import lru_cache
-# Environment and path setup
-current_dir = os.path.dirname(os.path.abspath(__file__))
-src_path = os.path.abspath(os.path.join(current_dir, "src"))
-print(f"Adding to path: {src_path}")
-sys.path.insert(0, src_path)
-# Configure cache directories
-base_dir = "/data"
-model_cache_dir = os.path.join(base_dir, "txagent_models")
-tool_cache_dir = os.path.join(base_dir, "tool_cache")
-file_cache_dir = os.path.join(base_dir, "cache")
 os.makedirs(model_cache_dir, exist_ok=True)
-os.makedirs(tool_cache_dir, exist_ok=True)
-os.makedirs(file_cache_dir, exist_ok=True)
 os.environ["TRANSFORMERS_CACHE"] = model_cache_dir
 os.environ["HF_HOME"] = model_cache_dir
-os.environ["TOKENIZERS_PARALLELISM"] = "false"
-os.environ["CUDA_LAUNCH_BLOCKING"] = "1"
 from txagent.txagent import TxAgent
 def sanitize_utf8(text: str) -> str:
     return text.encode("utf-8", "ignore").decode("utf-8")
-def file_hash(path: str) -> str:
     with open(path, "rb") as f:
         return hashlib.md5(f.read()).hexdigest()
-@lru_cache(maxsize=100)
-def get_cached_response(prompt: str, file_hash: str) -> Optional[str]:
-    return None
 def convert_file_to_json(file_path: str, file_type: str) -> str:
     try:
         h = file_hash(file_path)
-        cache_path = os.path.join(file_cache_dir, f"{h}.json")
         if os.path.exists(cache_path):
             return open(cache_path, "r", encoding="utf-8").read()
@@ -64,8 +66,7 @@ def convert_file_to_json(file_path: str, file_type: str) -> str:
             with pdfplumber.open(file_path) as pdf:
                 text = "\n".join([page.extract_text() or "" for page in pdf.pages])
             result = json.dumps({"filename": os.path.basename(file_path), "content": text.strip()})
-            with open(cache_path, "w", encoding="utf-8") as f:
-                f.write(result)
             return result
         else:
             return json.dumps({"error": f"Unsupported file type: {file_type}"})
@@ -76,49 +77,11 @@ def convert_file_to_json(file_path: str, file_type: str) -> str:
         df = df.fillna("")
         content = df.astype(str).values.tolist()
         result = json.dumps({"filename": os.path.basename(file_path), "rows": content})
-        with open(cache_path, "w", encoding="utf-8") as f:
-            f.write(result)
         return result
     except Exception as e:
         return json.dumps({"error": f"Error reading {os.path.basename(file_path)}: {str(e)}"})
-def convert_files_to_json_parallel(uploaded_files: list) -> str:
-    extracted_text = []
-    with ThreadPoolExecutor(max_workers=4) as executor:
-        futures = []
-        for file in uploaded_files:
-            if not hasattr(file, 'name'):
-                continue
-            path = file.name
-            ext = path.split(".")[-1].lower()
-            futures.append(executor.submit(convert_file_to_json, path, ext))
-        for future in as_completed(futures):
-            extracted_text.append(sanitize_utf8(future.result()))
-    return "\n".join(extracted_text)
-def init_agent():
-    default_tool_path = os.path.abspath("data/new_tool.json")
-    target_tool_path = os.path.join(tool_cache_dir, "new_tool.json")
-    if not os.path.exists(target_tool_path):
-        shutil.copy(default_tool_path, target_tool_path)
-    model_name = "mims-harvard/TxAgent-T1-Llama-3.1-8B"
-    rag_model_name = "mims-harvard/ToolRAG-T1-GTE-Qwen2-1.5B"
-    agent = TxAgent(
-        model_name=model_name,
-        rag_model_name=rag_model_name,
-        tool_files_dict={"new_tool": target_tool_path},
-        force_finish=True,
-        enable_checker=True,
-        step_rag_num=8,
-        seed=100,
-        additional_default_tools=[]
-    )
-    agent.init_model()
-    return agent
 def create_ui(agent: TxAgent):
     with gr.Blocks(theme=gr.themes.Soft()) as demo:
         gr.Markdown("<h1 style='text-align: center;'>📋 CPS: Clinical Patient Support System</h1>")
@@ -134,61 +97,60 @@ def create_ui(agent: TxAgent):
         conversation_state = gr.State([])
         def handle_chat(message: str, history: list, conversation: list, uploaded_files: list, progress=gr.Progress()):
-            start_time = time.time()
             try:
                 history.append({"role": "user", "content": message})
                 history.append({"role": "assistant", "content": "⏳ Processing your request..."})
                 yield history
-                file_process_time = time.time()
                 extracted_text = ""
                 if uploaded_files and isinstance(uploaded_files, list):
-                    extracted_text = convert_files_to_json_parallel(uploaded_files)
-                print(f"File processing took: {time.time() - file_process_time:.2f}s")
                 context = (
-                    "You are an expert clinical AI assistant. Review this patient's history, "
-                    "medications, and notes, and ONLY provide a final answer summarizing "
-                    "what the doctor might have missed."
                 )
                 chunked_prompt = f"{context}\n\n--- Patient Record ---\n{extracted_text}\n\n[Final Analysis]"
-                model_start = time.time()
                 generator = agent.run_gradio_chat(
                     message=chunked_prompt,
                     history=[],
                     temperature=0.3,
-                    max_new_tokens=768,
-                    max_token=4096,
                     call_agent=False,
                     conversation=conversation,
                     uploaded_files=uploaded_files,
-                    max_round=10
                 )
-                final_response = []
                 for update in generator:
                     if not update:
                         continue
-                    if isinstance(update, str):
-                        final_response.append(update)
-                    elif isinstance(update, list):
-                        final_response.extend(msg.content for msg in update if hasattr(msg, 'content'))
-                    if len(final_response) % 3 == 0:
-                        history[-1] = {"role": "assistant", "content": "".join(final_response).strip()}
-                        yield history
-                history[-1] = {"role": "assistant", "content": "".join(final_response).strip() or "❌ No response."}
-                print(f"Model processing took: {time.time() - model_start:.2f}s")
                 yield history
             except Exception as chat_error:
                 print(f"Chat handling error: {chat_error}")
                 history[-1] = {"role": "assistant", "content": "❌ An error occurred while processing your request."}
                 yield history
-            finally:
-                print(f"Total request time: {time.time() - start_time:.2f}s")
         inputs = [message_input, chatbot, conversation_state, file_upload]
         send_button.click(fn=handle_chat, inputs=inputs, outputs=chatbot)
@@ -201,32 +163,3 @@ def create_ui(agent: TxAgent):
         ], inputs=message_input)
     return demo
-if __name__ == "__main__":
-    print("Initializing agent...")
-    agent = init_agent()
-    print("Performing warm-up call...")
-    try:
-        warm_up = agent.run_gradio_chat(
-            message="Warm up",
-            history=[],
-            temperature=0.1,
-            max_new_tokens=10,
-            max_token=100,
-            call_agent=False,
-            conversation=[]
-        )
-        for _ in warm_up:
-            pass
-    except:
-        pass
-    print("Launching interface...")
-    demo = create_ui(agent)
-    demo.queue().launch(
-        server_name="0.0.0.0",
-        server_port=7860,
-        show_error=True,
-        share=True
-    )

 import pdfplumber
 import json
 import gradio as gr
+from typing import List
 from concurrent.futures import ThreadPoolExecutor, as_completed
 import hashlib
 import shutil
+# ✅ Fix: Add src to Python path
+sys.path.insert(0, os.path.abspath(os.path.join(os.path.dirname(__file__), "..", "src")))
+# ✅ Persist model cache to Hugging Face Space's /data directory
+model_cache_dir = "/data/txagent_models"
 os.makedirs(model_cache_dir, exist_ok=True)
 os.environ["TRANSFORMERS_CACHE"] = model_cache_dir
 os.environ["HF_HOME"] = model_cache_dir
 from txagent.txagent import TxAgent
 def sanitize_utf8(text: str) -> str:
     return text.encode("utf-8", "ignore").decode("utf-8")
+def clean_final_response(text: str) -> str:
+    cleaned = text.replace("[TOOL_CALLS]", "").strip()
+    responses = cleaned.split("[Final Analysis]")
+    if len(responses) <= 1:
+        return f"<div style='padding:1em;border:1px solid #ccc;border-radius:12px;color:#fff;background:#353F54;'><p>{cleaned}</p></div>"
+    panels = []
+    for i, section in enumerate(responses[1:], 1):
+        final = section.strip()
+        panels.append(
+            f"<div style='background:#2B2B2B;color:#E0E0E0;border-radius:12px;margin-bottom:1em;border:1px solid #888;'>"
+            f"<div style='font-size:1.1em;font-weight:bold;padding:0.75em;background:#3A3A3A;color:#fff;border-radius:12px 12px 0 0;'>🧠 Final Analysis #{i}</div>"
+            f"<div style='padding:1em;line-height:1.6;'>{final.replace(chr(10), '<br>')}</div>"
+            f"</div>"
+        )
+    return "".join(panels)
+def file_hash(path):
     with open(path, "rb") as f:
         return hashlib.md5(f.read()).hexdigest()
 def convert_file_to_json(file_path: str, file_type: str) -> str:
     try:
+        cache_dir = "/data/cache"
+        os.makedirs(cache_dir, exist_ok=True)
         h = file_hash(file_path)
+        cache_path = os.path.join(cache_dir, f"{h}.json")
         if os.path.exists(cache_path):
             return open(cache_path, "r", encoding="utf-8").read()
             with pdfplumber.open(file_path) as pdf:
                 text = "\n".join([page.extract_text() or "" for page in pdf.pages])
             result = json.dumps({"filename": os.path.basename(file_path), "content": text.strip()})
+            open(cache_path, "w", encoding="utf-8").write(result)
             return result
         else:
             return json.dumps({"error": f"Unsupported file type: {file_type}"})
         df = df.fillna("")
         content = df.astype(str).values.tolist()
         result = json.dumps({"filename": os.path.basename(file_path), "rows": content})
+        open(cache_path, "w", encoding="utf-8").write(result)
         return result
     except Exception as e:
         return json.dumps({"error": f"Error reading {os.path.basename(file_path)}: {str(e)}"})
 def create_ui(agent: TxAgent):
     with gr.Blocks(theme=gr.themes.Soft()) as demo:
         gr.Markdown("<h1 style='text-align: center;'>📋 CPS: Clinical Patient Support System</h1>")
         conversation_state = gr.State([])
         def handle_chat(message: str, history: list, conversation: list, uploaded_files: list, progress=gr.Progress()):
             try:
                 history.append({"role": "user", "content": message})
                 history.append({"role": "assistant", "content": "⏳ Processing your request..."})
                 yield history
                 extracted_text = ""
                 if uploaded_files and isinstance(uploaded_files, list):
+                    for file in uploaded_files:
+                        if not hasattr(file, 'name'):
+                            continue
+                        path = file.name
+                        ext = path.split(".")[-1].lower()
+                        json_text = convert_file_to_json(path, ext)
+                        extracted_text += sanitize_utf8(json_text) + "\n"
                 context = (
+                    "You are an expert clinical AI assistant. Review this patient's history, medications, and notes, and ONLY provide a final answer summarizing what the doctor might have missed."
                 )
                 chunked_prompt = f"{context}\n\n--- Patient Record ---\n{extracted_text}\n\n[Final Analysis]"
                 generator = agent.run_gradio_chat(
                     message=chunked_prompt,
                     history=[],
                     temperature=0.3,
+                    max_new_tokens=1024,
+                    max_token=8192,
                     call_agent=False,
                     conversation=conversation,
                     uploaded_files=uploaded_files,
+                    max_round=30
                 )
+                final_response = ""
                 for update in generator:
                     if not update:
                         continue
+                    if isinstance(update, list):
+                        for msg in update:
+                            if hasattr(msg, "content"):
+                                final_response += msg.content
+                    elif isinstance(update, str):
+                        final_response += update
+                    history[-1] = {"role": "assistant", "content": final_response.strip()}
+                    yield history
+                cleaned = final_response.strip().replace("[TOOL_CALLS]", "").strip()
+                history[-1] = {"role": "assistant", "content": cleaned or "❌ No response."}
                 yield history
             except Exception as chat_error:
                 print(f"Chat handling error: {chat_error}")
                 history[-1] = {"role": "assistant", "content": "❌ An error occurred while processing your request."}
                 yield history
         inputs = [message_input, chatbot, conversation_state, file_upload]
         send_button.click(fn=handle_chat, inputs=inputs, outputs=chatbot)
         ], inputs=message_input)
     return demo