multimodal-chat-MBTI-ISFP

Sleeping

App Files Files Community

seawolf2357 committed on Mar 17

Commit

3634066

verified ·

1 Parent(s): 05dc4f5

Update app-backup.py

Browse files

Files changed (1) hide show

app-backup.py +399 -142

app-backup.py CHANGED Viewed

@@ -6,6 +6,7 @@ import tempfile
 from collections.abc import Iterator
 from threading import Thread
 import cv2
 import gradio as gr
 import spaces
@@ -20,7 +21,55 @@ import pandas as pd
 # PDF 텍스트 추출
 import PyPDF2
-MAX_CONTENT_CHARS = 8000  # 너무 큰 파일을 막기 위해 최대 표시 8000자
 model_id = os.getenv("MODEL_ID", "google/gemma-3-27b-it")
 processor = AutoProcessor.from_pretrained(model_id, padding_side="left")
@@ -43,6 +92,10 @@ def analyze_csv_file(path: str) -> str:
     """
     try:
         df = pd.read_csv(path)
         df_str = df.to_string()
         if len(df_str) > MAX_CONTENT_CHARS:
             df_str = df_str[:MAX_CONTENT_CHARS] + "\n...(truncated)..."
@@ -73,11 +126,20 @@ def pdf_to_markdown(pdf_path: str) -> str:
     try:
         with open(pdf_path, "rb") as f:
             reader = PyPDF2.PdfReader(f)
-            for page_num, page in enumerate(reader.pages, start=1):
                 page_text = page.extract_text() or ""
                 page_text = page_text.strip()
                 if page_text:
-                    text_chunks.append(f"## Page {page_num}\n\n{page_text}\n")
     except Exception as e:
         return f"Failed to read PDF ({os.path.basename(pdf_path)}): {str(e)}"
@@ -97,7 +159,7 @@ def count_files_in_new_message(paths: list[str]) -> tuple[int, int]:
     for path in paths:
         if path.endswith(".mp4"):
             video_count += 1
-        else:
             image_count += 1
     return image_count, video_count
@@ -108,10 +170,13 @@ def count_files_in_history(history: list[dict]) -> tuple[int, int]:
     for item in history:
         if item["role"] != "user" or isinstance(item["content"], str):
             continue
-        if item["content"][0].endswith(".mp4"):
-            video_count += 1
-        else:
-            image_count += 1
     return image_count, video_count
@@ -123,11 +188,9 @@ def validate_media_constraints(message: dict, history: list[dict]) -> bool:
     - <image> 태그가 있으면 태그 수와 실제 이미지 수 일치
     - CSV, TXT, PDF 등은 여기서 제한하지 않음
     """
     media_files = []
     for f in message["files"]:
-        # 이미지: png/jpg/jpeg/gif/webp
-        # 비디오: mp4
-        # cf) PDF, CSV, TXT 등은 제외
         if re.search(r"\.(png|jpg|jpeg|gif|webp)$", f, re.IGNORECASE) or f.endswith(".mp4"):
             media_files.append(f)
@@ -149,9 +212,15 @@ def validate_media_constraints(message: dict, history: list[dict]) -> bool:
     if video_count == 0 and image_count > MAX_NUM_IMAGES:
         gr.Warning(f"You can upload up to {MAX_NUM_IMAGES} images.")
         return False
-    if "<image>" in message["text"] and message["text"].count("<image>") != new_image_count:
-        gr.Warning("The number of <image> tags in the text does not match the number of images.")
-        return False
     return True
@@ -164,7 +233,8 @@ def downsample_video(video_path: str) -> list[tuple[Image.Image, float]]:
     fps = vidcap.get(cv2.CAP_PROP_FPS)
     total_frames = int(vidcap.get(cv2.CAP_PROP_FRAME_COUNT))
-    frame_interval = int(fps / 3)
     frames = []
     for i in range(0, total_frames, frame_interval):
@@ -175,6 +245,10 @@ def downsample_video(video_path: str) -> list[tuple[Image.Image, float]]:
             pil_image = Image.fromarray(image)
             timestamp = round(i / fps, 2)
             frames.append((pil_image, timestamp))
     vidcap.release()
     return frames
@@ -200,9 +274,13 @@ def process_interleaved_images(message: dict) -> list[dict]:
     parts = re.split(r"(<image>)", message["text"])
     content = []
     image_index = 0
     for part in parts:
-        if part == "<image>":
-            content.append({"type": "image", "url": message["files"][image_index]})
             image_index += 1
         elif part.strip():
             content.append({"type": "text", "text": part.strip()})
@@ -216,13 +294,30 @@ def process_interleaved_images(message: dict) -> list[dict]:
 ##################################################
 # PDF + CSV + TXT + 이미지/비디오
 ##################################################
 def process_new_user_message(message: dict) -> list[dict]:
     if not message["files"]:
         return [{"type": "text", "text": message["text"]}]
     # 1) 파일 분류
-    video_files = [f for f in message["files"] if f.endswith(".mp4")]
-    image_files = [f for f in message["files"] if re.search(r"\.(png|jpg|jpeg|gif|webp)$", f, re.IGNORECASE)]
     csv_files = [f for f in message["files"] if f.lower().endswith(".csv")]
     txt_files = [f for f in message["files"] if f.lower().endswith(".txt")]
     pdf_files = [f for f in message["files"] if f.lower().endswith(".pdf")]
@@ -251,9 +346,13 @@ def process_new_user_message(message: dict) -> list[dict]:
         return content_list
     # 7) 이미지 처리
-    if "<image>" in message["text"]:
         # interleaved
-        return process_interleaved_images(message)
     else:
         # 일반 여러 장
         for img_path in image_files:
@@ -281,9 +380,18 @@ def process_history(history: list[dict]) -> list[dict]:
             content = item["content"]
             if isinstance(content, str):
                 current_user_content.append({"type": "text", "text": content})
-            else:
-                # 이미지나 기타
-                current_user_content.append({"type": "image", "url": content[0]})
     return messages
@@ -291,43 +399,100 @@ def process_history(history: list[dict]) -> list[dict]:
 # 메인 추론 함수
 ##################################################
 @spaces.GPU(duration=120)
-def run(message: dict, history: list[dict], system_prompt: str = "", max_new_tokens: int = 512) -> Iterator[str]:
     if not validate_media_constraints(message, history):
         yield ""
         return
-    messages = []
-    if system_prompt:
-        messages.append({"role": "system", "content": [{"type": "text", "text": system_prompt}]})
-    messages.extend(process_history(history))
-    messages.append({"role": "user", "content": process_new_user_message(message)})
-    inputs = processor.apply_chat_template(
-        messages,
-        add_generation_prompt=True,
-        tokenize=True,
-        return_dict=True,
-        return_tensors="pt",
-    ).to(device=model.device, dtype=torch.bfloat16)
-    streamer = TextIteratorStreamer(processor, timeout=30.0, skip_prompt=True, skip_special_tokens=True)
-    gen_kwargs = dict(
-        inputs,
-        streamer=streamer,
-        max_new_tokens=max_new_tokens,
-    )
-    t = Thread(target=model.generate, kwargs=gen_kwargs)
-    t.start()
-    output = ""
-    for new_text in streamer:
-        output += new_text
-        yield output
-##################################################
-# 예시들 (기존)
-##################################################
 ##################################################
 # 예시들 (한글화 버전)
 ##################################################
@@ -335,8 +500,12 @@ examples = [
     [
         {
-            "text": "PDF 파일 내용을 요약, 분석하라.",
             "files": ["assets/additional-examples/pdf.pdf"],
         }
     ],
     [
@@ -347,45 +516,34 @@ examples = [
     ],
     [
         {
-            "text": "동일한 막대 그래프를 그리는 matplotlib 코드를 작성해주세요.",
-            "files": ["assets/additional-examples/barchart.png"],
         }
-    ],
     [
         {
-            "text": "이 영상에서 이상한 점이 무엇인가요?",
-            "files": ["assets/additional-examples/tmp.mp4"],
         }
-    ],
     [
         {
             "text": "이미 이 영양제를 <image> 가지고 있고, 이 제품 <image>을 새로 사려 합니다. 함께 섭취할 때 주의해야 할 점이 있을까요?",
             "files": ["assets/additional-examples/pill1.png", "assets/additional-examples/pill2.png"],
         }
-    ],
-    [
-        {
-            "text": "이미지의 시각적 요소에서 영감을 받아 시를 작성해주세요.",
-            "files": ["assets/sample-images/06-1.png", "assets/sample-images/06-2.png"],
-        }
-    ],
     [
         {
-            "text": "이미지의 시각적 요소를 토대로 짧은 악곡을 작곡해주세요.",
-            "files": [
-                "assets/sample-images/07-1.png",
-                "assets/sample-images/07-2.png",
-                "assets/sample-images/07-3.png",
-                "assets/sample-images/07-4.png",
-            ],
         }
-    ],
     [
         {
-            "text": "이 집에서 무슨 일이 있었을지 짧은 이야기를 지어보세요.",
-            "files": ["assets/sample-images/08.png"],
         }
-    ],
     [
         {
             "text": "이미지들의 순서를 바탕으로 짧은 이야기를 만들어 주세요.",
@@ -400,40 +558,33 @@ examples = [
     ],
     [
         {
-            "text": "이 세계에서 살고 있을 생물들을 상상해서 묘사해주세요.",
-            "files": ["assets/sample-images/10.png"],
         }
     ],
     [
         {
-            "text": "이미지에 적힌 텍스트를 읽어주세요.",
-            "files": ["assets/additional-examples/1.png"],
         }
-    ],
     [
         {
-            "text": "이 티켓은 언제 발급된 것이고, 가격은 얼마인가요?",
-            "files": ["assets/additional-examples/2.png"],
         }
     ],
     [
         {
             "text": "이미지에 있는 텍스트를 그대로 읽어서 마크다운 형태로 적어주세요.",
             "files": ["assets/additional-examples/3.png"],
         }
     ],
-    [
-        {
-            "text": "이 적분을 풀어주세요.",
-            "files": ["assets/additional-examples/4.png"],
-        }
-    ],
-    [
-        {
-            "text": "이 이미지를 간단히 캡션으로 설명해주세요.",
-            "files": ["assets/sample-images/01.png"],
-        }
-    ],
     [
         {
             "text": "이 표지판에는 무슨 문구가 적혀 있나요?",
@@ -446,54 +597,160 @@ examples = [
             "files": ["assets/sample-images/03.png"],
         }
     ],
-    [
-        {
-            "text": "이미지에 보이는 모든 사물과 그 색상을 나열해주세요.",
-            "files": ["assets/sample-images/04.png"],
-        }
-    ],
-    [
-        {
-            "text": "장면의 분위기를 묘사해주세요.",
-            "files": ["assets/sample-images/05.png"],
-        }
-    ],
 ]
-demo = gr.ChatInterface(
-    fn=run,
-    type="messages",
-    chatbot=gr.Chatbot(type="messages", scale=1, allow_tags=["image"]),
-    # .webp, .png, .jpg, .jpeg, .gif, .mp4, .csv, .txt, .pdf 모두 허용
-    textbox=gr.MultimodalTextbox(
-        file_types=[
-            ".webp", ".png", ".jpg", ".jpeg", ".gif",
-            ".mp4", ".csv", ".txt", ".pdf"
-        ],
-        file_count="multiple",
-        autofocus=True
-    ),
-    multimodal=True,
-    additional_inputs=[
-        gr.Textbox(
-            label="System Prompt",
-            value=(
-                "You are a deeply thoughtful AI. Consider problems thoroughly and derive "
-                "correct solutions through systematic reasoning. Please answer in korean."
             )
-        ),
-        gr.Slider(label="Max New Tokens", minimum=100, maximum=8000, step=50, value=2000),
-    ],
-    stop_btn=False,
-    title="Vidraft-Gemma-3-27B",
-    examples=examples,
-    run_examples_on_click=False,
-    cache_examples=False,
-    css_paths="style.css",
-    delete_cache=(1800, 1800),
-)
 if __name__ == "__main__":
     demo.launch()

 from collections.abc import Iterator
 from threading import Thread
+import requests  # <-- For SERPHouse web search
 import cv2
 import gradio as gr
 import spaces
 # PDF 텍스트 추출
 import PyPDF2
+##############################################################################
+# SERPHouse API key for web search
+# Read from the SERPHOUSE_API_KEY environment variable so the credential is
+# never stored in the repository. The key that used to be hard-coded on this
+# line has been published and must be revoked/rotated.
+# An empty string means "not configured".
+##############################################################################
+SERPHOUSE_API_KEY = os.getenv("SERPHOUSE_API_KEY", "")
+##############################################################################
+# Simple function to call the SERPHouse Live endpoint
+# https://api.serphouse.com/serp/live
+##############################################################################
+def do_web_search(query: str) -> str:
+    """
+    Query the SERPHouse live endpoint and format the top organic results.
+
+    Args:
+        query: Search keywords, sent as the `q` request parameter.
+
+    Returns:
+        A Markdown string with up to three organic results (rank, linked
+        title, quoted snippet); "No web search results found." when the
+        response carries no organic results; or "Web search failed: ..."
+        when the request or the response handling raises.
+    """
+    try:
+        url = "https://api.serphouse.com/serp/live"
+        params = {
+            "q": query,
+            "domain": "google.com",
+            "lang": "en",
+            "device": "desktop",
+            "serp_type": "web",
+            "api_token": SERPHOUSE_API_KEY,
+        }
+        resp = requests.get(url, params=params, timeout=30)
+        resp.raise_for_status()  # Raise an exception for 4xx/5xx errors
+        data = resp.json()
+        # Walk data["results"]["results"]["organic"]. A missing or null level is
+        # treated as "no results" instead of surfacing as an AttributeError.
+        organic = data
+        for key in ("results", "results", "organic"):
+            organic = organic.get(key) if isinstance(organic, dict) else None
+        if not isinstance(organic, list) or not organic:
+            return "No web search results found."
+        # For demonstration, only the top 3 organic results are reported.
+        summary_lines = []
+        for item in organic[:3]:
+            rank = item.get("position", "-")
+            title = item.get("title", "No Title")
+            link = item.get("link", "No Link")
+            snippet = item.get("snippet", "(No snippet)")
+            summary_lines.append(f"**Rank {rank}:** [{title}]({link})\n\n> {snippet}")
+        return "\n\n".join(summary_lines)
+    except Exception as e:
+        # Best-effort feature: report the failure as text rather than raising.
+        logger.error(f"Web search failed: {e}")
+        return f"Web search failed: {str(e)}"
+MAX_CONTENT_CHARS = 4000  # Show at most 4000 characters so that overly large files are cut off
 model_id = os.getenv("MODEL_ID", "google/gemma-3-27b-it")
 processor = AutoProcessor.from_pretrained(model_id, padding_side="left")
     """
     try:
         df = pd.read_csv(path)
+        # 데이터 프레임 크기 제한 (행/열 수가 많은 경우)
+        if df.shape[0] > 50 or df.shape[1] > 10:
+            df = df.iloc[:50, :10]
         df_str = df.to_string()
         if len(df_str) > MAX_CONTENT_CHARS:
             df_str = df_str[:MAX_CONTENT_CHARS] + "\n...(truncated)..."
     try:
         with open(pdf_path, "rb") as f:
             reader = PyPDF2.PdfReader(f)
+            # 최대 5페이지만 처리
+            max_pages = min(5, len(reader.pages))
+            for page_num in range(max_pages):
+                page = reader.pages[page_num]
                 page_text = page.extract_text() or ""
                 page_text = page_text.strip()
                 if page_text:
+                    # 페이지별 텍스트도 제한
+                    if len(page_text) > MAX_CONTENT_CHARS // max_pages:
+                        page_text = page_text[:MAX_CONTENT_CHARS // max_pages] + "...(truncated)"
+                    text_chunks.append(f"## Page {page_num+1}\n\n{page_text}\n")
+            if len(reader.pages) > max_pages:
+                text_chunks.append(f"\n...(Showing {max_pages} of {len(reader.pages)} pages)...")
     except Exception as e:
         return f"Failed to read PDF ({os.path.basename(pdf_path)}): {str(e)}"
     for path in paths:
         if path.endswith(".mp4"):
             video_count += 1
+        elif re.search(r"\.(png|jpg|jpeg|gif|webp)$", path, re.IGNORECASE):
             image_count += 1
     return image_count, video_count
     for item in history:
         if item["role"] != "user" or isinstance(item["content"], str):
             continue
+        if isinstance(item["content"], list) and len(item["content"]) > 0:
+            file_path = item["content"][0]
+            if isinstance(file_path, str):
+                if file_path.endswith(".mp4"):
+                    video_count += 1
+                elif re.search(r"\.(png|jpg|jpeg|gif|webp)$", file_path, re.IGNORECASE):
+                    image_count += 1
     return image_count, video_count
     - <image> 태그가 있으면 태그 수와 실제 이미지 수 일치
     - CSV, TXT, PDF 등은 여기서 제한하지 않음
     """
+    # 이미지와 비디오 파일만 필터링
     media_files = []
     for f in message["files"]:
         if re.search(r"\.(png|jpg|jpeg|gif|webp)$", f, re.IGNORECASE) or f.endswith(".mp4"):
             media_files.append(f)
     if video_count == 0 and image_count > MAX_NUM_IMAGES:
         gr.Warning(f"You can upload up to {MAX_NUM_IMAGES} images.")
         return False
+    # 이미지 태그 검증 (실제 이미지 파일만 계산)
+    if "<image>" in message["text"]:
+        # 이미지 파일만 필터링
+        image_files = [f for f in message["files"] if re.search(r"\.(png|jpg|jpeg|gif|webp)$", f, re.IGNORECASE)]
+        image_tag_count = message["text"].count("<image>")
+        if image_tag_count != len(image_files):
+            gr.Warning("The number of <image> tags in the text does not match the number of image files.")
+            return False
     return True
     fps = vidcap.get(cv2.CAP_PROP_FPS)
     total_frames = int(vidcap.get(cv2.CAP_PROP_FRAME_COUNT))
+    # 더 적은 프레임을 추출하도록 조정
+    frame_interval = max(int(fps), int(total_frames / 10))  # 초당 1프레임 또는 최대 10프레임
     frames = []
     for i in range(0, total_frames, frame_interval):
             pil_image = Image.fromarray(image)
             timestamp = round(i / fps, 2)
             frames.append((pil_image, timestamp))
+            # 최대 5프레임만 사용
+            if len(frames) >= 5:
+                break
     vidcap.release()
     return frames
     parts = re.split(r"(<image>)", message["text"])
     content = []
     image_index = 0
+    # 이미지 파일만 필터링
+    image_files = [f for f in message["files"] if re.search(r"\.(png|jpg|jpeg|gif|webp)$", f, re.IGNORECASE)]
     for part in parts:
+        if part == "<image>" and image_index < len(image_files):
+            content.append({"type": "image", "url": image_files[image_index]})
             image_index += 1
         elif part.strip():
             content.append({"type": "text", "text": part.strip()})
 ##################################################
 # PDF + CSV + TXT + 이미지/비디오
 ##################################################
+def is_image_file(file_path: str) -> bool:
+    """Return True when the path ends with png, jpg, jpeg, gif or webp (any letter case)."""
+    image_suffix = re.search(r"\.(png|jpg|jpeg|gif|webp)$", file_path, re.IGNORECASE)
+    return image_suffix is not None
+def is_video_file(file_path: str) -> bool:
+    """Return True when the path ends with ".mp4", ignoring letter case.
+
+    The comparison is case-insensitive so that an upload such as "clip.MP4"
+    is classified as a video, in line with how the image and document checks
+    already accept upper-case extensions.
+    """
+    return file_path.lower().endswith(".mp4")
+def is_document_file(file_path: str) -> bool:
+    """Return True when the path ends with .pdf, .csv or .txt (case-insensitive)."""
+    document_suffixes = (".pdf", ".csv", ".txt")
+    return file_path.lower().endswith(document_suffixes)
 def process_new_user_message(message: dict) -> list[dict]:
     if not message["files"]:
         return [{"type": "text", "text": message["text"]}]
     # 1) 파일 분류
+    video_files = [f for f in message["files"] if is_video_file(f)]
+    image_files = [f for f in message["files"] if is_image_file(f)]
     csv_files = [f for f in message["files"] if f.lower().endswith(".csv")]
     txt_files = [f for f in message["files"] if f.lower().endswith(".txt")]
     pdf_files = [f for f in message["files"] if f.lower().endswith(".pdf")]
         return content_list
     # 7) 이미지 처리
+    if "<image>" in message["text"] and image_files:
         # interleaved
+        interleaved_content = process_interleaved_images({"text": message["text"], "files": image_files})
+        # 원본 content_list 앞부분(텍스트)을 제거하고 interleaved로 대체
+        if content_list[0]["type"] == "text":
+            content_list = content_list[1:]  # 원본 텍스트 제거
+        return interleaved_content + content_list  # interleaved + 나머지 문서 분석 내용
     else:
         # 일반 여러 장
         for img_path in image_files:
             content = item["content"]
             if isinstance(content, str):
                 current_user_content.append({"type": "text", "text": content})
+            elif isinstance(content, list) and len(content) > 0:
+                file_path = content[0]
+                if is_image_file(file_path):
+                    current_user_content.append({"type": "image", "url": file_path})
+                else:
+                    # 비이미지 파일은 텍스트로 처리
+                    current_user_content.append({"type": "text", "text": f"[File: {os.path.basename(file_path)}]"})
+    # 마지막 사용자 메시지가 처리되지 않은 경우 추가
+    if current_user_content:
+        messages.append({"role": "user", "content": current_user_content})
     return messages
 # 메인 추론 함수
 ##################################################
 @spaces.GPU(duration=120)
+def run(
+    message: dict,
+    history: list[dict],
+    system_prompt: str = "",
+    max_new_tokens: int = 512,
+    use_web_search: bool = False,
+    web_search_query: str = "",
+) -> Iterator[str]:
+    """
+    Main inference function: stream the model's reply to a multimodal message.
+
+    Args:
+        message: New user turn, a dict with "text" and "files" entries (as read
+            by the validation and message-processing helpers called here).
+        history: Earlier chat turns, converted with process_history().
+        system_prompt: Optional system text placed before the history.
+        max_new_tokens: Generation budget passed to model.generate().
+        use_web_search: When True and the query is non-blank, call SERPHouse first.
+        web_search_query: Keywords handed to do_web_search().
+
+    Yields:
+        The full response text so far. Every yield is cumulative (the same
+        convention the token loop uses), so the web-search block, when present,
+        is kept as a prefix of each later value instead of being yielded once
+        and then overwritten by the first streamed chunk.
+        Yields "" when media validation fails, and a Korean error message
+        containing the exception text when anything in the pipeline raises.
+    """
+    # Validate media constraints first
     if not validate_media_constraints(message, history):
         yield ""
         return
+    try:
+        # If the user opted for "Web Search", run it first and show the result.
+        # NOTE(review): the search results are only displayed; they are not
+        # added to `messages`, so the model itself does not see them.
+        prefix = ""
+        query = web_search_query.strip()
+        if use_web_search and query:
+            ws_result = do_web_search(query)
+            prefix = f"**[Web Search Results for '{query}':]**\n\n{ws_result}\n\n---\n"
+            yield prefix
+        messages = []
+        if system_prompt:
+            messages.append({"role": "system", "content": [{"type": "text", "text": system_prompt}]})
+        messages.extend(process_history(history))
+        # Process the new user message
+        user_content = process_new_user_message(message)
+        # Truncate overly long text parts to reduce the token count
+        for item in user_content:
+            if item["type"] == "text" and len(item["text"]) > MAX_CONTENT_CHARS:
+                item["text"] = item["text"][:MAX_CONTENT_CHARS] + "\n...(truncated)..."
+        messages.append({"role": "user", "content": user_content})
+        # Final check before building the model input: any "image" part whose
+        # URL is not an image file is replaced by a text placeholder.
+        for msg in messages:
+            if msg["role"] != "user":
+                continue
+            filtered_content = []
+            for item in msg["content"]:
+                if item["type"] == "image":
+                    if is_image_file(item["url"]):
+                        filtered_content.append(item)
+                    else:
+                        # Not an image file: convert to text
+                        filtered_content.append({
+                            "type": "text",
+                            "text": f"[Non-image file: {os.path.basename(item['url'])}]"
+                        })
+                else:
+                    filtered_content.append(item)
+            msg["content"] = filtered_content
+        # Build the model input
+        inputs = processor.apply_chat_template(
+            messages,
+            add_generation_prompt=True,
+            tokenize=True,
+            return_dict=True,
+            return_tensors="pt",
+        ).to(device=model.device, dtype=torch.bfloat16)
+        # Set up the text-generation streamer
+        streamer = TextIteratorStreamer(processor, timeout=30.0, skip_prompt=True, skip_special_tokens=True)
+        gen_kwargs = dict(
+            inputs,
+            streamer=streamer,
+            max_new_tokens=max_new_tokens,
+        )
+        # Generate in a separate thread so the streamer can be consumed here
+        t = Thread(target=model.generate, kwargs=gen_kwargs)
+        t.start()
+        # Stream the result, keeping the web-search block in front of it
+        output = ""
+        for new_text in streamer:
+            output += new_text
+            yield prefix + output
+    except Exception as e:
+        logger.error(f"Error in run: {str(e)}")
+        yield f"죄송합니다. 오류가 발생했습니다: {str(e)}"
 ##################################################
 # 예시들 (한글화 버전)
 ##################################################
     [
         {
+            "text": "두 PDF 파일 내용을 비교하라.",
             "files": ["assets/additional-examples/pdf.pdf"],
+            "files": [
+                "assets/additional-examples/before.pdf",
+                "assets/additional-examples/after.pdf",
+            ],
         }
     ],
     [
     ],
     [
         {
+            "text": "이 영상의 내용을 설명하라",
+            "files": ["assets/additional-examples/tmp.mp4"],
         }
+    ],
     [
         {
+            "text": "표지 내용을 설명하고 글자를 읽어주세요.",
+            "files": ["assets/additional-examples/maz.jpg"],
         }
+    ],
     [
         {
             "text": "이미 이 영양제를 <image> 가지고 있고, 이 제품 <image>을 새로 사려 합니다. 함께 섭취할 때 주의해야 할 점이 있을까요?",
             "files": ["assets/additional-examples/pill1.png", "assets/additional-examples/pill2.png"],
         }
+    ],
     [
         {
+            "text": "이 적분을 풀어주세요.",
+            "files": ["assets/additional-examples/4.png"],
         }
+    ],
     [
         {
+            "text": "이 티켓은 언제 발급된 것이고, 가격은 얼마인가요?",
+            "files": ["assets/additional-examples/2.png"],
         }
+    ],
     [
         {
             "text": "이미지들의 순서를 바탕으로 짧은 이야기를 만들어 주세요.",
     ],
     [
         {
+            "text": "이미지의 시각적 요소에서 영감을 받아 시를 작성해주세요.",
+            "files": ["assets/sample-images/06-1.png", "assets/sample-images/06-2.png"],
         }
     ],
     [
         {
+            "text": "동일한 막대 그래프를 그리는 matplotlib 코드를 작성해주세요.",
+            "files": ["assets/additional-examples/barchart.png"],
         }
+    ],
     [
         {
+            "text": "이 세계에서 살고 있을 생물들을 상상해서 묘사해주세요.",
+            "files": ["assets/sample-images/08.png"],
         }
     ],
     [
         {
             "text": "이미지에 있는 텍스트를 그대로 읽어서 마크다운 형태로 적어주세요.",
             "files": ["assets/additional-examples/3.png"],
         }
     ],
     [
         {
             "text": "이 표지판에는 무슨 문구가 적혀 있나요?",
             "files": ["assets/sample-images/03.png"],
         }
     ],
 ]
+##############################################################################
+# Custom CSS for the page, passed to gr.Blocks(css=css) below:
+#   - gradient page background on <body>
+#   - white, rounded, shadowed .gradio-container panel (max-width 1200px)
+#   - centered example area (#examples_container / #examples_row)
+#   - .sidebar panel style
+#   - gradient buttons that scale up slightly on hover
+##############################################################################
+css = """
+body {
+    background: linear-gradient(135deg, #667eea, #764ba2);
+    font-family: 'Helvetica Neue', Helvetica, Arial, sans-serif;
+    color: #333;
+    margin: 0;
+    padding: 0;
+}
+.gradio-container {
+    background: rgba(255, 255, 255, 0.95);
+    border-radius: 15px;
+    padding: 30px 40px;
+    box-shadow: 0 8px 30px rgba(0, 0, 0, 0.3);
+    margin: 40px auto;
+    max-width: 1200px;
+}
+.gradio-container h1 {
+    color: #333;
+    text-shadow: 1px 1px 2px rgba(0, 0, 0, 0.2);
+}
+.fillable {
+    width: 95% !important;
+    max-width: unset !important;
+}
+#examples_container {
+    margin: auto;
+    width: 90%;
+}
+#examples_row {
+    justify-content: center;
+}
+.sidebar {
+    background: rgba(255, 255, 255, 0.98);
+    border-radius: 10px;
+    padding: 20px;
+    box-shadow: 0 4px 15px rgba(0, 0, 0, 0.2);
+}
+button, .btn {
+    background: linear-gradient(90deg, #ff8a00, #e52e71);
+    border: none;
+    color: #fff;
+    padding: 12px 24px;
+    text-transform: uppercase;
+    font-weight: bold;
+    letter-spacing: 1px;
+    border-radius: 5px;
+    cursor: pointer;
+    transition: transform 0.2s ease-in-out;
+}
+button:hover, .btn:hover {
+    transform: scale(1.05);
+}
+"""
+# HTML header (centered title and subtitle) rendered at the top of the page
+# through gr.Markdown(title_html).
+title_html = """
+<h1 align="center" style="margin-bottom: 0.2em;"> 🤗 Vidraft-Gemma-3-27B </h1>
+<p align="center" style="font-size:1.1em; color:#555;">
+    Multimodal Chat Interface + Optional Web Search
+</p>
+"""
+##############################################################################
+# Build a Blocks layout that includes:
+#   - A left sidebar with "Web Search" controls
+#   - The main ChatInterface in the center or right
+##############################################################################
+with gr.Blocks(css=css, title="Vidraft-Gemma-3-27B") as demo:
+    gr.Markdown(title_html)
+    with gr.Row():
+        # Left Sidebar
+        # The components created here are handed to the ChatInterface below as
+        # additional_inputs, so their values reach run() on every request.
+        with gr.Column(scale=3, variant="panel"):
+            gr.Markdown("### Menu / Options")
+            with gr.Row():
+                web_search_checkbox = gr.Checkbox(
+                    label="Web Search",
+                    value=False,
+                    info="Check to enable a SERPHouse web search before the chat reply"
+                )
+            web_search_text = gr.Textbox(
+                lines=1,
+                label="Web Search Query",
+                placeholder="Enter search keywords..."
+            )
+            gr.Markdown("---")
+            gr.Markdown("#### System Prompt")
+            system_prompt_box = gr.Textbox(
+                lines=3,
+                value=(
+                    "You are a deeply thoughtful AI. Consider problems thoroughly and derive "
+                    "correct solutions through systematic reasoning. Please answer in korean."
+                ),
+            )
+            max_tokens_slider = gr.Slider(
+                label="Max New Tokens",
+                minimum=100,
+                maximum=8000,
+                step=50,
+                value=2000,
+            )
+            gr.Markdown("<br><br>")  # spacing
+        # Main ChatInterface to the right
+        with gr.Column(scale=7):
+            chat = gr.ChatInterface(
+                fn=run,
+                type="messages",
+                chatbot=gr.Chatbot(type="messages", scale=1, allow_tags=["image"]),
+                textbox=gr.MultimodalTextbox(
+                    file_types=[
+                        ".webp", ".png", ".jpg", ".jpeg", ".gif",
+                        ".mp4", ".csv", ".txt", ".pdf"
+                    ],
+                    file_count="multiple",
+                    autofocus=True
+                ),
+                multimodal=True,
+                # Order matches run()'s extra parameters: system_prompt,
+                # max_new_tokens, use_web_search, web_search_query.
+                additional_inputs=[
+                    system_prompt_box,
+                    max_tokens_slider,
+                    web_search_checkbox,
+                    web_search_text,
+                ],
+                stop_btn=False,
+                title="Vidraft-Gemma-3-27B",
+                examples=examples,
+                run_examples_on_click=False,
+                cache_examples=False,
+                css_paths=None,
+                delete_cache=(1800, 1800),
+            )
+    with gr.Row(elem_id="examples_row"):
+        with gr.Column(scale=12, elem_id="examples_container"):
+            gr.Markdown("### Example Inputs (click to load)")
+            # The fix: pass an empty list to avoid the "None" error, so we keep the code structure.
+            # NOTE(review): `examples` is also passed to gr.ChatInterface above, so
+            # the same list is supplied twice. With inputs=[] no component is wired
+            # to receive a clicked example — TODO confirm this gallery is functional
+            # or remove it.
+            gr.Examples(
+                examples=examples,
+                inputs=[],  # Instead of None or chat.
+                cache_examples=False
             )
 if __name__ == "__main__":
     demo.launch()