eikarna committed
Commit 33009e3 · Parent: d9760ae

Revert to non-RAG

Files changed (1)
  1. app.py.bak +264 -0
app.py.bak ADDED
@@ -0,0 +1,264 @@
+ import streamlit as st
+ import requests
+ import logging
+ import time
+ from typing import Dict, Any, Optional, List
+ import os
+ import tempfile
+ from PIL import Image
+ import pytesseract
+ import fitz  # PyMuPDF
+ from sentence_transformers import SentenceTransformer
+ import numpy as np
+
+ # Configure logging
+ logging.basicConfig(
+     level=logging.INFO,
+     format='%(asctime)s - %(name)s - %(levelname)s - %(message)s'
+ )
+ logger = logging.getLogger(__name__)
+
+ # Initialize SBERT model for embeddings
+ @st.cache_resource
+ def load_embedding_model():
+     return SentenceTransformer('all-MiniLM-L6-v2')
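+ # Note: all-MiniLM-L6-v2 encodes text into 384-dimensional vectors; encode()
+ # accepts a string or a list of strings, e.g.
+ #   vec = load_embedding_model().encode("hello")  # np.ndarray, shape (384,)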
+
+ # Simple in-memory vector store
+ class SimpleVectorStore:
+     def __init__(self):
+         self.documents = []
+         self.embeddings = []
+
+     def add_document(self, text: str, embedding: np.ndarray):
+         self.documents.append(text)
+         self.embeddings.append(embedding)
+
+     def search(self, query_embedding: np.ndarray, top_k: int = 3) -> List[str]:
+         if not self.embeddings:
+             return []
+
+         similarities = np.dot(self.embeddings, query_embedding)
+         top_indices = np.argsort(similarities)[-top_k:][::-1]
+         return [self.documents[i] for i in top_indices]
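+ # Note: dot-product scores only rank by cosine similarity if the embeddings
+ # are unit-normalized (e.g. encode(..., normalize_embeddings=True)); with raw
+ # embeddings, longer vectors are favored. A hypothetical usage sketch:
+ #   store = SimpleVectorStore()
+ #   store.add_document("cats purr", model.encode("cats purr"))
+ #   store.search(model.encode("why do cats purr?"), top_k=1)  # -> ["cats purr"]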
+
+ # Document processing functions
+ def process_text(text: str) -> List[str]:
+     """Split text into sentence-sized chunks."""
+     # Naive sentence split; avoid doubling the final period
+     chunks = text.split('. ')
+     return [chunk if chunk.endswith('.') else chunk + '.' for chunk in chunks if chunk]
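+ # Example: process_text("A. B. C.") -> ["A.", "B.", "C."]. Note the split also
+ # fires inside abbreviations such as "e.g. ", a known limitation of this chunker.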
+
+ def process_image(image) -> str:
+     """Extract text from image using OCR."""
+     try:
+         text = pytesseract.image_to_string(image)
+         return text
+     except Exception as e:
+         logger.error(f"Error processing image: {str(e)}")
+         return ""
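+ # Note: pytesseract is only a wrapper; the tesseract-ocr binary must be
+ # installed on the host (on Hugging Face Spaces, e.g. via packages.txt).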
+
+ def process_pdf(pdf_file) -> str:
+     """Extract text from PDF."""
+     try:
+         with tempfile.NamedTemporaryFile(delete=False) as tmp_file:
+             tmp_file.write(pdf_file.read())
+             tmp_file.flush()
+
+         doc = fitz.open(tmp_file.name)
+         text = ""
+         for page in doc:
+             text += page.get_text()
+         doc.close()
+         os.unlink(tmp_file.name)
+         return text
+     except Exception as e:
+         logger.error(f"Error processing PDF: {str(e)}")
+         return ""
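+ # Design note: PyMuPDF can also read from memory, which would avoid the temp
+ # file entirely: doc = fitz.open(stream=pdf_file.read(), filetype="pdf")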
+
+ # Initialize session state
+ if "messages" not in st.session_state:
+     st.session_state.messages = []
+ if "request_timestamps" not in st.session_state:
+     st.session_state.request_timestamps = []
+ if "vector_store" not in st.session_state:
+     st.session_state.vector_store = SimpleVectorStore()
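+ # Note: st.session_state is scoped to one browser session, so the chat
+ # history and vector store reset whenever the page is reloaded.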
+
+ # Rate limiting configuration
+ RATE_LIMIT_PERIOD = 60  # seconds (sliding window)
+ MAX_REQUESTS_PER_PERIOD = 30
+
+ def check_rate_limit() -> bool:
+     """Check if we're within rate limits."""
+     current_time = time.time()
+     st.session_state.request_timestamps = [
+         ts for ts in st.session_state.request_timestamps
+         if current_time - ts < RATE_LIMIT_PERIOD
+     ]
+
+     if len(st.session_state.request_timestamps) >= MAX_REQUESTS_PER_PERIOD:
+         return False
+
+     st.session_state.request_timestamps.append(current_time)
+     return True
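+ # Example: with the defaults, the 31st call inside any 60 s window returns
+ # False and is not recorded, so rejected calls do not extend the window.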
+
+ def query(payload: Dict[str, Any], api_url: str) -> Optional[Dict[str, Any]]:
+     """Query the Hugging Face API with error handling and rate limiting."""
+     if not check_rate_limit():
+         raise Exception(f"Rate limit exceeded. Please wait {RATE_LIMIT_PERIOD} seconds.")
+
+     try:
+         headers = {"Authorization": f"Bearer {st.secrets['HF_TOKEN']}"}
+         response = requests.post(api_url, headers=headers, json=payload, timeout=30)
+
+         if response.status_code == 429:
+             raise Exception("Too many requests. Please try again later.")
+
+         response.raise_for_status()
+         # Log at debug level only; the request headers carry the bearer token
+         # and must never be printed.
+         logger.debug("POST %s -> %s", response.request.url, response.status_code)
+         return response.json()
+     except requests.exceptions.RequestException as e:
+         logger.error(f"API request failed: {str(e)}")
+         raise
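+ # Note: for text-generation models the serverless Inference API usually
+ # responds with a list like [{"generated_text": "..."}]; process_response
+ # below assumes exactly that shape.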
+
+ # Response validation: unwrap [{"generated_text": ...}] from the API reply
+ def process_response(response: List[Dict[str, Any]]) -> str:
+     if not isinstance(response, list) or not response:
+         raise ValueError("Invalid response format")
+
+     if 'generated_text' not in response[0]:
+         raise ValueError("Unexpected response structure")
+
+     text = response[0]['generated_text'].strip()
+     return text
+
+ # Page configuration
+ st.set_page_config(
+     page_title="RAG-Enabled DeepSeek Chatbot",
+     page_icon="🤖",
+     layout="wide"
+ )
+
+ # Sidebar configuration
+ with st.sidebar:
+     st.header("Model Configuration")
+     st.markdown("[Get HuggingFace Token](https://huggingface.co/settings/tokens)")
+
+     model_options = [
+         "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B",
+     ]
+     selected_model = st.selectbox("Select Model", model_options, index=0)
+
+     system_message = st.text_area(
+         "System Message",
+         value="You are a friendly chatbot with RAG capabilities. Use the provided context to answer questions accurately. If the context doesn't contain relevant information, say so.",
+         height=100
+     )
+
+     max_tokens = st.slider("Max Tokens", 10, 4000, 100)
+     temperature = st.slider("Temperature", 0.1, 4.0, 0.3)
+     top_p = st.slider("Top-p", 0.1, 1.0, 0.6)
+
+     # File upload section
+     st.header("Upload Knowledge Base")
+     uploaded_files = st.file_uploader(
+         "Upload files (PDF, Images, Text)",
+         type=['pdf', 'png', 'jpg', 'jpeg', 'txt'],
+         accept_multiple_files=True
+     )
+
+ # Process uploaded files
+ if uploaded_files:
+     embedding_model = load_embedding_model()
+
+     for file in uploaded_files:
+         try:
+             if file.type == "application/pdf":
+                 text = process_pdf(file)
+             elif file.type.startswith("image/"):
+                 image = Image.open(file)
+                 text = process_image(image)
+             else:  # text files
+                 text = file.getvalue().decode()
+
+             chunks = process_text(text)
+             for chunk in chunks:
+                 embedding = embedding_model.encode(chunk)
+                 st.session_state.vector_store.add_document(chunk, embedding)
+
+             st.sidebar.success(f"Successfully processed {file.name}")
+         except Exception as e:
+             st.sidebar.error(f"Error processing {file.name}: {str(e)}")
+
+ # Main chat interface
+ st.title("🤖 RAG-Enabled DeepSeek Chatbot")
+ st.caption("Upload documents in the sidebar to enhance the chatbot's knowledge")
+
+ # Display chat history
+ for message in st.session_state.messages:
+     with st.chat_message(message["role"]):
+         st.markdown(message["content"])
+
+ # Handle user input
+ if prompt := st.chat_input("Type your message..."):
+     # Display user message
+     st.session_state.messages.append({"role": "user", "content": prompt})
+     with st.chat_message("user"):
+         st.markdown(prompt)
+
+     try:
+         with st.spinner("Generating response..."):
+             embedding_model = load_embedding_model()
+             query_embedding = embedding_model.encode(prompt)
+             relevant_contexts = st.session_state.vector_store.search(query_embedding)
+
+             # Dynamic context handling
+             context_text = "\n".join(relevant_contexts) if relevant_contexts else ""
+             system_msg = (
+                 f"{system_message} Use the provided context to answer accurately."
+                 if context_text
+                 else system_message
+             )
+
+             # Format for DeepSeek model
+             full_prompt = f"""<|beginofutterance|>System: {system_msg}
+ {context_text}
+ <|endofutterance|>
+ <|beginofutterance|>User: {prompt}<|endofutterance|>
+ <|beginofutterance|>Assistant:"""
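+             # Note: the <|beginofutterance|>/<|endofutterance|> markers are an
+             # assumed chat format; DeepSeek-R1-Distill checkpoints normally ship
+             # their own chat template, so this raw prompt may need adjusting.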
+
+             payload = {
+                 "inputs": full_prompt,
+                 "parameters": {
+                     "max_new_tokens": max_tokens,
+                     "temperature": temperature,
+                     "top_p": top_p,
+                     "return_full_text": False
+                 }
+             }
+
+             api_url = f"https://api-inference.huggingface.co/models/{selected_model}"
+
+             # Get and process response
+             output = query(payload, api_url)
+             if output:
+                 response_text = process_response(output)
+
+                 # Display assistant response
+                 with st.chat_message("assistant"):
+                     st.markdown(response_text)
+
+                 # Update chat history
+                 st.session_state.messages.append({
+                     "role": "assistant",
+                     "content": response_text
+                 })
+
+     except Exception as e:
+         logger.error(f"Error: {str(e)}", exc_info=True)
+         st.error(f"Error: {str(e)}")