Update app.py
app.py CHANGED
@@ -5,8 +5,8 @@ import re
 import tempfile
 from collections.abc import Iterator
 from threading import Thread
-
-import requests #
+import json  # ← added for JSON conversion
+import requests  # SERPHouse web search
 import cv2
 import gradio as gr
 import spaces
@@ -22,7 +22,7 @@ import pandas as pd
 import PyPDF2
 
 ##############################################################################
-# SERPHouse API key from environment variable
+# SERPHouse API key from environment variable (must be set by the user)
 ##############################################################################
 SERPHOUSE_API_KEY = os.getenv("SERPHOUSE_API_KEY", "")
 
@@ -44,11 +44,12 @@ def extract_keywords(text: str, top_k: int = 5) -> str:
     return " ".join(key_tokens)
 
 ##############################################################################
-# Call the SERPHouse Live endpoint
+# Call the SERPHouse Live endpoint
+# - Put all top-20 "full items" (raw JSON) into the system msg for the LLM to reference
 ##############################################################################
 def do_web_search(query: str) -> str:
     """
-    Call SERPHouse live search, top 20 results
+    Call SERPHouse live search and return all top-20 'organic' results bundled as JSON.
     """
     try:
         url = "https://api.serphouse.com/serp/live"
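The request itself sits outside this hunk. For context, a minimal sketch of what a call to the Live endpoint could look like; the payload field names and the auth header here are assumptions for illustration, not taken from the diff or from SERPHouse documentation:

```python
import os
import requests

SERPHOUSE_API_KEY = os.getenv("SERPHOUSE_API_KEY", "")

def fetch_serp_live(query: str) -> dict:
    """Hypothetical sketch of a SERPHouse Live request; parameter names are assumed."""
    url = "https://api.serphouse.com/serp/live"
    payload = {"q": query, "num_result": 20}  # assumed parameter names
    headers = {"Authorization": f"Bearer {SERPHOUSE_API_KEY}"}
    resp = requests.post(url, json=payload, headers=headers, timeout=30)
    resp.raise_for_status()
    return resp.json()
```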
@@ -70,10 +71,12 @@ def do_web_search(query: str) -> str:
         if not organic:
             return "No web search results found."
 
+        # Convert each item (all fields) to JSON and collect it
         summary_lines = []
         for idx, item in enumerate(organic[:20], start=1):
-
-
+            # Convert the entire item to a JSON string
+            item_json = json.dumps(item, ensure_ascii=False, indent=2)
+            summary_lines.append(f"Result {idx}:\n{item_json}\n")
 
         return "\n".join(summary_lines)
     except Exception as e:
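The effect of the new loop is easy to see in isolation. A self-contained sketch with a made-up `organic` list (the field names are illustrative, not SERPHouse's actual schema):

```python
import json

# Illustrative stand-in for the parsed response; these field names are made up.
organic = [
    {"title": "Result A", "link": "https://example.com/a", "snippet": "..."},
    {"title": "Result B", "link": "https://example.com/b", "snippet": "..."},
]

summary_lines = []
for idx, item in enumerate(organic[:20], start=1):
    # Dump every field of the item, not just a title/link summary.
    item_json = json.dumps(item, ensure_ascii=False, indent=2)
    summary_lines.append(f"Result {idx}:\n{item_json}\n")

print("\n".join(summary_lines))
```

`ensure_ascii=False` keeps non-ASCII text (e.g. Korean) readable instead of \u-escaping it, which matters when the LLM is meant to read the results verbatim.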
@@ -144,7 +147,6 @@ def pdf_to_markdown(pdf_path: str) -> str:
             page_text = page.extract_text() or ""
             page_text = page_text.strip()
             if page_text:
-                # Limit the text per page
                 if len(page_text) > MAX_CONTENT_CHARS // max_pages:
                     page_text = page_text[:MAX_CONTENT_CHARS // max_pages] + "...(truncated)"
                 text_chunks.append(f"## Page {page_num+1}\n\n{page_text}\n")
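The removed comment described what the surrounding lines already make clear: each page gets an equal share of the total character budget. A quick illustration, with `MAX_CONTENT_CHARS` and `max_pages` values assumed for the example:

```python
MAX_CONTENT_CHARS = 4000  # assumed value for illustration
max_pages = 5             # assumed value for illustration

page_text = "x" * 2000
per_page_budget = MAX_CONTENT_CHARS // max_pages  # 800 chars per page
if len(page_text) > per_page_budget:
    page_text = page_text[:per_page_budget] + "...(truncated)"
print(len(page_text))  # 800 + len("...(truncated)")
```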
@@ -396,18 +398,17 @@ def run(
         return
 
     try:
-        # If web_search is True =>
-        # extract keywords from message["text"] and search
+        # If web_search is True => extract keywords from message["text"] and call SERPHouse
         history_system_msg = None
         if use_web_search:
             user_text = message["text"]
             # 1) Extract keywords
             ws_query = extract_keywords(user_text, top_k=5)
             logger.info(f"[Auto WebSearch Keyword] {ws_query!r}")
-            # 2) Top-20 results
+            # 2) Fetch the top-20 results (full items)
             ws_result = do_web_search(ws_query)
             # 3) Add them as a system message
-            system_search_content = f"[Search top-20
+            system_search_content = f"[Search top-20 Full Items Based on user prompt]\n{ws_result}\n"
             if system_search_content.strip():
                 history_system_msg = {
                     "role": "system",
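Pieced together, the pre-generation web-search branch now reads roughly as below. `extract_keywords` and `do_web_search` are the functions from this file; the `content` key on the system message is an assumption, since the hunk cuts off right after `"role": "system"`:

```python
history_system_msg = None
if use_web_search:
    user_text = message["text"]
    # 1) keywords from the user prompt
    ws_query = extract_keywords(user_text, top_k=5)
    # 2) top-20 organic items, serialized as JSON text
    ws_result = do_web_search(ws_query)
    # 3) hand the raw results to the model as a system turn
    system_search_content = f"[Search top-20 Full Items Based on user prompt]\n{ws_result}\n"
    if system_search_content.strip():
        history_system_msg = {
            "role": "system",
            "content": system_search_content,  # assumed key; the hunk ends before it
        }
```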
@@ -644,7 +645,6 @@ with gr.Blocks(css=css, title="Vidraft-Gemma-3-27B") as demo:
                 value=False,
                 info="Check to enable a SERPHouse web search (auto keywords) before the chat reply"
             )
-            # In practice keywords are auto-extracted; the textbox below is unused.
             web_search_text = gr.Textbox(
                 lines=1,
                 label="(Unused) Web Search Query",
|