Spaces:

sagar007
/

DeepSeekR1_Search

Running on Zero

App Files Files Community

sagar007 committed on Feb 22

Commit

60c475d

verified ·

1 Parent(s): c908926

Update app.py

Browse files

Files changed (1) hide show

app.py +187 -454

app.py CHANGED Viewed

@@ -1,513 +1,246 @@
 import gradio as gr
-from transformers import AutoModelForCausalLM, AutoTokenizer
-import spaces
 from duckduckgo_search import DDGS
-import time
-import torch
 from datetime import datetime
-import os
-import subprocess
-import numpy as np
-from typing import List, Dict, Tuple, Any
-# Install required dependencies for Kokoro with better error handling
-try:
-    subprocess.run(['git', 'lfs', 'install'], check=True)
-    if not os.path.exists('Kokoro-82M'):
-        subprocess.run(['git', 'clone', 'https://huggingface.co/hexgrad/Kokoro-82M'], check=True)
-    # Try installing espeak with proper package manager commands
-    try:
-        subprocess.run(['apt-get', 'update'], check=True)
-        subprocess.run(['apt-get', 'install', '-y', 'espeak'], check=True)
-    except subprocess.CalledProcessError:
-        print("Warning: Could not install espeak. Attempting espeak-ng...")
-        try:
-            subprocess.run(['apt-get', 'install', '-y', 'espeak-ng'], check=True)
-        except subprocess.CalledProcessError:
-            print("Warning: Could not install espeak or espeak-ng. TTS functionality may be limited.")
-except Exception as e:
-    print(f"Warning: Initial setup error: {str(e)}")
-    print("Continuing with limited functionality...")
-# --- Initialization (Do this ONCE) ---
-model_name = "deepseek-ai/DeepSeek-R1-Distill-Llama-8B"
-tokenizer = AutoTokenizer.from_pretrained(model_name)
-tokenizer.pad_token = tokenizer.eos_token
-# Initialize DeepSeek model
-model = AutoModelForCausalLM.from_pretrained(
-    model_name,
-    device_map="auto",
-    offload_folder="offload",
-    low_cpu_mem_usage=True,
-    torch_dtype=torch.float16
-)
-# Initialize Kokoro TTS (with error handling)
-VOICE_CHOICES = {
-    '🇺🇸 Female (Default)': 'af',
-    '🇺🇸 Bella': 'af_bella',
-    '🇺🇸 Sarah': 'af_sarah',
-    '🇺🇸 Nicole': 'af_nicole'
-}
-TTS_ENABLED = False
-TTS_MODEL = None
-VOICEPACK = None
-try:
-    if os.path.exists('Kokoro-82M'):
-        import sys
-        sys.path.append('Kokoro-82M')
-        from models import build_model  # type: ignore
-        from kokoro import generate  # type: ignore
-        device = 'cuda' if torch.cuda.is_available() else 'cpu'
-        TTS_MODEL = build_model('Kokoro-82M/kokoro-v0_19.pth', device)
-        # Load default voice
-        try:
-            VOICEPACK = torch.load('Kokoro-82M/voices/af.pt', map_location=device, weights_only=True)
-        except Exception as e:
-            print(f"Warning: Could not load default voice: {e}")
-            raise
-        TTS_ENABLED = True
-    else:
-        print("Warning: Kokoro-82M directory not found. TTS disabled.")
-except Exception as e:
-    print(f"Warning: Could not initialize Kokoro TTS: {str(e)}")
-    TTS_ENABLED = False
-def get_web_results(query: str, max_results: int = 5) -> List[Dict[str, str]]:
-    """Get web search results using DuckDuckGo"""
     try:
         with DDGS() as ddgs:
-            results = list(ddgs.text(query, max_results=max_results))
-            return [{
-                "title": result.get("title", ""),
-                "snippet": result["body"],
-                "url": result["href"],
-                "date": result.get("published", "")
-            } for result in results]
     except Exception as e:
-        print(f"Error in web search: {e}")
-        return []
-def format_prompt(query: str, context: List[Dict[str, str]]) -> str:
-    """Format the prompt with web context"""
     current_time = datetime.now().strftime("%Y-%m-%d %H:%M:%S")
-    context_lines = '\n'.join([f'- [{res["title"]}]: {res["snippet"]}' for res in context])
-    return f"""You are an intelligent search assistant. Answer the user's query using the provided web context.
-Current Time: {current_time}
-Important: For election-related queries, please distinguish clearly between different election years and types (presidential vs. non-presidential). Only use information from the provided web context.
 Query: {query}
 Web Context:
-{context_lines}
-Provide a detailed answer in markdown format. Include relevant information from sources and cite them using [1], [2], etc. If the query is about elections, clearly specify which year and type of election you're discussing.
-Answer:"""
-def format_sources(web_results: List[Dict[str, str]]) -> str:
-    """Format sources with more details"""
     if not web_results:
-        return "<div class='no-sources'>No sources available</div>"
-    sources_html = "<div class='sources-container'>"
     for i, res in enumerate(web_results, 1):
-        title = res["title"] or "Source"
-        date = f"<span class='source-date'>{res['date']}</span>" if res['date'] else ""
         sources_html += f"""
         <div class='source-item'>
-            <div class='source-number'>[{i}]</div>
-            <div class='source-content'>
-                <a href="{res['url']}" target="_blank" class='source-title'>{title}</a>
-                {date}
-                <div class='source-snippet'>{res['snippet'][:150]}...</div>
-            </div>
         </div>
         """
     sources_html += "</div>"
     return sources_html
-@spaces.GPU(duration=30)
-def generate_answer(prompt: str) -> str:
-    """Generate answer using the DeepSeek model"""
-    inputs = tokenizer(
-        prompt,
-        return_tensors="pt",
-        padding=True,
-        truncation=True,
-        max_length=512,
-        return_attention_mask=True
-    ).to(model.device)
-    outputs = model.generate(
-        inputs.input_ids,
-        attention_mask=inputs.attention_mask,
-        max_new_tokens=256,
-        temperature=0.7,
-        top_p=0.95,
-        pad_token_id=tokenizer.eos_token_id,
-        do_sample=True,
-        early_stopping=True
-    )
-    return tokenizer.decode(outputs[0], skip_special_tokens=True)
-@spaces.GPU(duration=30)
-def generate_speech_with_gpu(text: str, voice_name: str = 'af', tts_model=TTS_MODEL, voicepack=VOICEPACK) -> Tuple[int, np.ndarray] | None:
-    """Generate speech from text using Kokoro TTS model."""
-    if not TTS_ENABLED or tts_model is None:
-        print("TTS is not enabled or model is not loaded.")
-        return None
-    try:
-        device = 'cuda' if torch.cuda.is_available() else 'cpu'
-        # Handle voicepack loading
-        voice_file = f'Kokoro-82M/voices/{voice_name}.pt'
-        if voice_name == 'af' and voicepack is not None:
-            # Use the pre-loaded default voicepack
-            pass
-        elif os.path.exists(voice_file):
-            # Load the selected voicepack if it exists
-            voicepack = torch.load(voice_file, map_location=device, weights_only=True)
-        else:
-            # Fall back to default 'af' if selected voicepack is missing
-            print(f"Voicepack {voice_name}.pt not found. Falling back to default 'af'.")
-            voice_file = 'Kokoro-82M/voices/af.pt'
-            if os.path.exists(voice_file):
-                voicepack = torch.load(voice_file, map_location=device, weights_only=True)
-            else:
-                print("Default voicepack 'af.pt' not found. Cannot generate audio.")
-                return None
-        # Clean the text
-        clean_text = ' '.join([line for line in text.split('\n') if not line.startswith('#')])
-        clean_text = clean_text.replace('[', '').replace(']', '').replace('*', '')
-        # Split long text into chunks
-        max_chars = 1000
-        chunks = []
-        if len(clean_text) > max_chars:
-            sentences = clean_text.split('.')
-            current_chunk = ""
-            for sentence in sentences:
-                if len(current_chunk) + len(sentence) + 1 < max_chars:
-                    current_chunk += sentence + "."
-                else:
-                    chunks.append(current_chunk.strip())
-                    current_chunk = sentence + "."
-            if current_chunk:
-                chunks.append(current_chunk.strip())
-        else:
-            chunks = [clean_text]
-        # Generate audio for each chunk
-        audio_chunks = []
-        for chunk in chunks:
-            if chunk.strip():
-                chunk_audio, _ = generate(tts_model, chunk, voicepack, lang='a')
-                if isinstance(chunk_audio, torch.Tensor):
-                    chunk_audio = chunk_audio.cpu().numpy()
-                audio_chunks.append(chunk_audio)
-        # Concatenate chunks
-        if audio_chunks:
-            final_audio = np.concatenate(audio_chunks) if len(audio_chunks) > 1 else audio_chunks[0]
-            return (24000, final_audio)
-        else:
-            return None
-    except Exception as e:
-        print(f"Error generating speech: {str(e)}")
-        return None
-def process_query(query: str, history: List[List[str]], selected_voice: str = 'af'):
-    """Process user query with streaming effect"""
-    try:
-        if history is None:
-            history = []
-        # Get web results first
-        web_results = get_web_results(query)
-        sources_html = format_sources(web_results)
-        current_history = history + [[query, "*Searching...*"]]
-        # Yield initial searching state
-        yield (
-            "*Searching & Thinking...*",  # answer_output (Markdown)
-            sources_html,                  # sources_output (HTML)
-            "Searching...",               # search_btn (Button)
-            current_history,              # chat_history_display (Chatbot)
-            None                          # audio_output (Audio)
-        )
-        # Generate answer
-        prompt = format_prompt(query, web_results)
-        answer = generate_answer(prompt)
-        final_answer = answer.split("Answer:")[-1].strip()
-        # Update history before TTS
-        updated_history = history + [[query, final_answer]]
-        # Generate speech from the answer (only if enabled)
-        if TTS_ENABLED:
-            yield (
-                final_answer,              # answer_output
-                sources_html,              # sources_output
-                "Generating audio...",     # search_btn
-                updated_history,           # chat_history_display
-                None                       # audio_output
-            )
-            try:
-                audio = generate_speech_with_gpu(final_answer, selected_voice)
-                if audio is None:
-                    final_answer += "\n\n*Audio generation failed. The voicepack may be missing or incompatible.*"
-            except Exception as e:
-                final_answer += f"\n\n*Error generating audio: {str(e)}*"
-                audio = None
-        else:
-            final_answer += "\n\n*TTS is disabled. Audio not available.*"
-            audio = None
-        # Yield final result
-        yield (
-            final_answer,              # answer_output
-            sources_html,              # sources_output
-            "Search",                  # search_btn
-            updated_history,           # chat_history_display
-            audio if audio is not None else None  # audio_output
-        )
-    except Exception as e:
-        error_message = str(e)
-        if "GPU quota" in error_message:
-            error_message = "⚠️ GPU quota exceeded. Please try again later when the daily quota resets."
-        yield (
-            f"Error: {error_message}",  # answer_output
-            sources_html,               # sources_output
-            "Search",                   # search_btn
-            history + [[query, f"*Error: {error_message}*"]],  # chat_history_display
-            None                        # audio_output
-        )
-# Update the CSS for better contrast and readability
 css = """
 .gradio-container {
-    max-width: 1200px !important;
-    background-color: #f7f7f8 !important;
 }
-#header {
     text-align: center;
-    margin-bottom: 2rem;
-    padding: 2rem 0;
-    background: #1a1b1e;
-    border-radius: 12px;
-    color: white;
-}
-#header h1 {
-    color: white;
-    font-size: 2.5rem;
-    margin-bottom: 0.5rem;
 }
-#header h3 {
-    color: #a8a9ab;
 }
-.search-container {
-    background: #1a1b1e;
-    border-radius: 12px;
-    box-shadow: 0 4px 12px rgba(0,0,0,0.1);
-    padding: 1rem;
-    margin-bottom: 1rem;
 }
 .search-box {
-    padding: 1rem;
-    background: #2c2d30;
-    border-radius: 8px;
-    margin-bottom: 1rem;
-}
-.search-box input[type="text"] {
-    background: #3a3b3e !important;
-    border: 1px solid #4a4b4e !important;
-    color: white !important;
-    border-radius: 8px !important;
-}
-.search-box input[type="text"]::placeholder {
-    color: #a8a9ab !important;
 }
 .search-box button {
-    background: #2563eb !important;
     border: none !important;
 }
 .results-container {
-    background: #2c2d30;
-    border-radius: 8px;
-    padding: 1rem;
-    margin-top: 1rem;
 }
 .answer-box {
-    background: #3a3b3e;
-    border-radius: 8px;
-    padding: 1.5rem;
-    color: white;
-    margin-bottom: 1rem;
-}
-.answer-box p {
-    color: #e5e7eb;
     line-height: 1.6;
 }
-.sources-container {
-    margin-top: 1rem;
-    background: #2c2d30;
-    border-radius: 8px;
-    padding: 1rem;
 }
 .source-item {
-    display: flex;
-    padding: 12px;
-    margin: 8px 0;
-    background: #3a3b3e;
-    border-radius: 8px;
-    transition: all 0.2s;
-}
-.source-item:hover {
-    background: #4a4b4e;
 }
 .source-number {
     font-weight: bold;
-    margin-right: 12px;
-    color: #60a5fa;
-}
-.source-content {
-    flex: 1;
 }
-.source-title {
-    color: #60a5fa;
-    font-weight: 500;
     text-decoration: none;
-    display: block;
-    margin-bottom: 4px;
-}
-.source-date {
-    color: #a8a9ab;
-    font-size: 0.9em;
-    margin-left: 8px;
 }
-.source-snippet {
-    color: #e5e7eb;
-    font-size: 0.9em;
-    line-height: 1.4;
 }
-.chat-history {
-    max-height: 400px;
     overflow-y: auto;
-    padding: 1rem;
-    background: #2c2d30;
-    border-radius: 8px;
-    margin-top: 1rem;
-}
-.examples-container {
-    background: #2c2d30;
-    border-radius: 8px;
-    padding: 1rem;
-    margin-top: 1rem;
-}
-.examples-container button {
-    background: #3a3b3e !important;
-    border: 1px solid #4a4b4e !important;
-    color: #e5e7eb !important;
-}
-.markdown-content {
-    color: #e5e7eb !important;
-}
-.markdown-content h1, .markdown-content h2, .markdown-content h3 {
-    color: white !important;
-}
-.markdown-content a {
-    color: #60a5fa !important;
-}
-.accordion {
-    background: #2c2d30 !important;
-    border-radius: 8px !important;
-    margin-top: 1rem !important;
-}
-.voice-selector {
-    margin-top: 1rem;
-    background: #2c2d30;
-    border-radius: 8px;
-    padding: 0.5rem;
-}
-.voice-selector select {
-    background: #3a3b3e !important;
-    color: white !important;
-    border: 1px solid #4a4b4e !important;
 }
 """
-# Update the Gradio interface layout
-with gr.Blocks(title="AI Search Assistant", css=css, theme="dark") as demo:
-    chat_history = gr.State([])
-    with gr.Column(elem_id="header"):
-        gr.Markdown("# 🔍 AI Search Assistant")
-        gr.Markdown("### Powered by DeepSeek & Real-time Web Results with Voice")
-    with gr.Column(elem_classes="search-container"):
-        with gr.Row(elem_classes="search-box"):
-            search_input = gr.Textbox(
-                label="",
-                placeholder="Ask anything...",
-                scale=5,
-                container=False
-            )
-            search_btn = gr.Button("Search", variant="primary", scale=1)
-            voice_select = gr.Dropdown(
-                choices=list(VOICE_CHOICES.items()),
-                value='af',
-                label="Select Voice",
-                elem_classes="voice-selector"
-            )
-        with gr.Row(elem_classes="results-container"):
-            with gr.Column(scale=2):
-                with gr.Column(elem_classes="answer-box"):
-                    answer_output = gr.Markdown(elem_classes="markdown-content")
-                    with gr.Row():
-                        audio_output = gr.Audio(label="Voice Response", elem_classes="audio-player")
-                with gr.Accordion("Chat History", open=False, elem_classes="accordion"):
-                    chat_history_display = gr.Chatbot(elem_classes="chat-history")
-            with gr.Column(scale=1):
-                with gr.Column(elem_classes="sources-box"):
-                    gr.Markdown("### Sources")
-                    sources_output = gr.HTML()
-        with gr.Row(elem_classes="examples-container"):
-            gr.Examples(
-                examples=[
-                    "musk explores blockchain for doge",
-                    "nvidia to launch new gaming card",
-                    "What are the best practices for sustainable living?",
-                    "tesla mistaken for asteroid"
-                ],
-                inputs=search_input,
-                label="Try these examples"
-            )
-    # Handle interactions
     search_btn.click(
-        fn=process_query,
-        inputs=[search_input, chat_history, voice_select],
-        outputs=[answer_output, sources_output, search_btn, chat_history_display, audio_output]
     )
-    # Also trigger search on Enter key
     search_input.submit(
-        fn=process_query,
-        inputs=[search_input, chat_history, voice_select],
-        outputs=[answer_output, sources_output, search_btn, chat_history_display, audio_output]
     )
 if __name__ == "__main__":
-    demo.launch(share=True)

 import gradio as gr
+from transformers import pipeline
 from duckduckgo_search import DDGS
 from datetime import datetime
+import asyncio
# Initialize a lightweight text generation model (distilgpt2 for speed).
# The gradio module has no `cuda` attribute, so GPU availability is probed
# through torch; if torch cannot be imported the pipeline stays on CPU (-1).
try:
    import torch

    _device = 0 if torch.cuda.is_available() else -1
except ImportError:
    _device = -1
generator = pipeline("text-generation", model="distilgpt2", device=_device)
+# Web search function using DuckDuckGo
async def get_web_results(query: str, max_results: int = 5) -> list:
    """Fetch DuckDuckGo text results for *query* from an async context.

    Args:
        query: Search string handed to ``DDGS.text``.
        max_results: Maximum number of hits requested from the search.

    Returns:
        A list of dicts with the keys ``"title"``, ``"snippet"`` and
        ``"url"``. If anything goes wrong, a single placeholder entry whose
        title is ``"Error"`` is returned instead of raising.
    """
    try:
        with DDGS() as ddgs:
            # The search call is synchronous, so it runs on a worker thread.
            hits = await asyncio.to_thread(
                lambda: list(ddgs.text(query, max_results=max_results))
            )
            # Tolerant lookups: one hit missing a field must not throw away
            # every other result via the blanket handler below.
            return [
                {
                    "title": hit.get("title") or "No Title",
                    "snippet": hit.get("body", ""),
                    "url": hit.get("href", "#"),
                }
                for hit in hits
            ]
    except Exception as e:
        # Callers expect a list in every case, so the failure is reported
        # as a pseudo-result rather than propagated.
        return [{"title": "Error", "snippet": f"Failed to fetch results: {str(e)}", "url": "#"}]
+# Format prompt for the AI model
def format_prompt(query: str, web_results: list) -> str:
    """Build the model prompt from the query and the fetched web results.

    Args:
        query: The user's question.
        web_results: Dicts providing at least ``"title"`` and ``"snippet"``.

    Returns:
        A prompt containing the current local time, the query, one numbered
        context line per result, and the closing instruction line.
    """
    current_time = datetime.now().strftime("%Y-%m-%d %H:%M:%S")
    # Number the entries from 1 so the "[1], [2]" citations requested in the
    # instruction have something concrete to refer to.
    context = "\n".join(
        f"[{i}] {r['title']}: {r['snippet']}"
        for i, r in enumerate(web_results, 1)
    )
    return (
        f"Time: {current_time}\n"
        f"Query: {query}\n"
        "Web Context:\n"
        f"{context}\n"
        "Provide a detailed, well-structured answer in markdown format with citations [1], [2], etc."
    )
+# Generate answer using the AI model
def generate_answer(prompt: str) -> str:
    """Generate the model's continuation of *prompt*.

    Args:
        prompt: Full prompt text, as produced by ``format_prompt``.

    Returns:
        Only the newly generated text, stripped of surrounding whitespace.
    """
    outputs = generator(
        prompt,
        # Budget the continuation itself; a total-length cap would be used
        # up by the prompt and leave little or nothing to generate.
        max_new_tokens=300,
        num_return_sequences=1,
        truncation=True,
        # Let the pipeline drop the prompt instead of searching the output
        # for the instruction line, which fails if that line is missing.
        return_full_text=False,
    )
    return outputs[0]["generated_text"].strip()
+# Format sources for display
def format_sources(web_results: list) -> str:
    """Render the web results as an HTML list of numbered sources.

    Titles, snippets and URLs come from the web and are HTML-escaped before
    being interpolated. URLs that are not http(s) are replaced with ``#``.

    Args:
        web_results: Dicts with the keys ``"title"``, ``"snippet"`` and
            ``"url"``.

    Returns:
        An HTML fragment: a ``sources-list`` div holding one ``source-item``
        per result, or a "No sources available" div for empty input.
    """
    import html  # function-scope import keeps this block self-contained

    if not web_results:
        return "<div>No sources available</div>"

    items = []
    for i, res in enumerate(web_results, 1):
        raw_url = str(res["url"])
        # Only link out to web URLs; anything else (e.g. "javascript:")
        # collapses to an inert anchor.
        if not raw_url.startswith(("http://", "https://")):
            raw_url = "#"
        url = html.escape(raw_url, quote=True)
        title = html.escape(str(res["title"]))
        snippet = str(res["snippet"])
        # Truncate before escaping so an entity is never cut in half, and
        # add the ellipsis only when text was actually dropped.
        preview = html.escape(snippet[:150])
        if len(snippet) > 150:
            preview += "..."
        items.append(f"""
        <div class='source-item'>
            <span class='source-number'>[{i}]</span>
            <a href='{url}' target='_blank' rel='noopener noreferrer'>{title}</a>: {preview}
        </div>
        """)
    return "<div class='sources-list'>" + "".join(items) + "</div>"
+# Main processing function
async def process_deep_research(query: str, history: list):
    """Run search and answer generation, yielding progressive UI updates.

    Args:
        query: The user's question.
        history: Earlier ``[query, answer]`` pairs; a falsy value is treated
            as an empty history.

    Yields:
        Dicts with the keys ``"answer"``, ``"sources"`` and ``"history"``:
        first a "searching" placeholder, then an "analyzing" placeholder
        together with the rendered sources, and finally the generated
        answer.
    """
    history = history or []

    # Step 1: Initial loading state
    yield {
        "answer": "*Searching the web...*",
        "sources": "<div>Fetching sources...</div>",
        "history": history + [[query, "*Searching...*"]],
    }

    # Step 2: Fetch web results
    web_results = await get_web_results(query)
    sources_html = format_sources(web_results)

    # Step 3: Update with web search completed
    yield {
        "answer": "*Analyzing results...*",
        "sources": sources_html,
        "history": history + [[query, "*Analyzing...*"]],
    }

    # Step 4: Generate detailed answer. generate_answer is a synchronous
    # call, so it is pushed to a worker thread (as the web search is)
    # rather than run directly inside this coroutine.
    prompt = format_prompt(query, web_results)
    answer = await asyncio.to_thread(generate_answer, prompt)

    # Step 5: Final result
    yield {
        "answer": answer,
        "sources": sources_html,
        "history": history + [[query, answer]],
    }
+# Custom CSS for a cool, modern UI
 css = """
+body {
+    font-family: 'Arial', sans-serif;
+    background: #1a1a1a;
+    color: #ffffff;
+}
 .gradio-container {
+    max-width: 1000px;
+    margin: 0 auto;
+    padding: 20px;
 }
+.header {
     text-align: center;
+    padding: 20px;
+    background: linear-gradient(135deg, #2c3e50, #3498db);
+    border-radius: 10px;
+    margin-bottom: 20px;
 }
+.header h1 {
+    font-size: 2.5em;
+    margin: 0;
+    color: #ffffff;
 }
+.header p {
+    color: #bdc3c7;
+    font-size: 1.1em;
 }
 .search-box {
+    background: #2c2c2c;
+    padding: 15px;
+    border-radius: 10px;
+    box-shadow: 0 4px 10px rgba(0, 0, 0, 0.3);
+}
+.search-box input {
+    background: #3a3a3a !important;
+    color: #ffffff !important;
+    border: none !important;
+    border-radius: 5px !important;
 }
 .search-box button {
+    background: #3498db !important;
     border: none !important;
+    border-radius: 5px !important;
+    transition: background 0.3s;
+}
+.search-box button:hover {
+    background: #2980b9 !important;
 }
 .results-container {
+    margin-top: 20px;
+    display: flex;
+    gap: 20px;
 }
 .answer-box {
+    flex: 2;
+    background: #2c2c2c;
+    padding: 20px;
+    border-radius: 10px;
+    box-shadow: 0 4px 10px rgba(0, 0, 0, 0.3);
+}
+.answer-box .markdown {
+    color: #ecf0f1;
     line-height: 1.6;
 }
+.sources-list {
+    flex: 1;
+    background: #2c2c2c;
+    padding: 15px;
+    border-radius: 10px;
+    box-shadow: 0 4px 10px rgba(0, 0, 0, 0.3);
 }
 .source-item {
+    margin-bottom: 10px;
 }
 .source-number {
+    color: #3498db;
     font-weight: bold;
+    margin-right: 5px;
 }
+.source-item a {
+    color: #3498db;
     text-decoration: none;
 }
+.source-item a:hover {
+    text-decoration: underline;
 }
+.history-box {
+    margin-top: 20px;
+    background: #2c2c2c;
+    padding: 15px;
+    border-radius: 10px;
+    max-height: 300px;
     overflow-y: auto;
+    box-shadow: 0 4px 10px rgba(0, 0, 0, 0.3);
 }
 """
+# Gradio app setup with Blocks for better control
with gr.Blocks(title="Deep Research Engine", css=css) as demo:
    # Per-session list of [query, answer] pairs fed back into each request.
    history_state = gr.State([])

    # Header
    with gr.Column(elem_classes="header"):
        gr.Markdown("# Deep Research Engine")
        gr.Markdown("Your gateway to in-depth answers with real-time web insights.")

    # Search input and button
    with gr.Row(elem_classes="search-box"):
        search_input = gr.Textbox(label="", placeholder="Ask anything...", lines=2)
        search_btn = gr.Button("Research", variant="primary")

    # Results layout
    with gr.Row(elem_classes="results-container"):
        with gr.Column():
            answer_output = gr.Markdown(label="Research Findings", elem_classes="answer-box")
        with gr.Column():
            sources_output = gr.HTML(label="Sources", elem_classes="sources-list")

    # Chat history
    with gr.Row():
        history_display = gr.Chatbot(label="History", elem_classes="history-box")

    async def handle_search(query, history):
        """Stream each research step as (answer, sources, history) outputs."""
        async for step in process_deep_research(query, history):
            yield step["answer"], step["sources"], step["history"]

    # The button click and the textbox submit share one wiring. No
    # client-side JS hook is attached: the declared inputs already deliver
    # the textbox value and the stored history, and a hook returning `null`
    # for the second input would wipe that history on every click.
    for trigger in (search_btn.click, search_input.submit):
        trigger(
            fn=handle_search,
            inputs=[search_input, history_state],
            outputs=[answer_output, sources_output, history_display],
        ).then(
            # Persist what the Chatbot now shows so the next request sees it.
            fn=lambda shown: shown,
            inputs=[history_display],
            outputs=[history_state],
        )

# Launch the app
if __name__ == "__main__":
    demo.launch()