Spaces:

chalisesagun
/

deepseek-chat

Sleeping

chalisesagun committed on Dec 28, 2024

Commit

145163e

verified ·

1 Parent(s): 90af65d

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,4 +1,5 @@
 import os
 import streamlit as st
 from langchain.document_loaders import PyPDFLoader
 from langchain.text_splitter import RecursiveCharacterTextSplitter
@@ -23,9 +24,18 @@ if api_key:
     if uploaded_file:
         # Load and process the document
         with st.spinner("Processing document..."):
-            loader = PyPDFLoader(uploaded_file)
             documents = loader.load()
             # Split the document into chunks
             text_splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=50)
             chunks = text_splitter.split_documents(documents)

 import os
+import tempfile
 import streamlit as st
 from langchain.document_loaders import PyPDFLoader
 from langchain.text_splitter import RecursiveCharacterTextSplitter
     if uploaded_file:
         # Load and process the document
         with st.spinner("Processing document..."):
+            # Save the uploaded file temporarily
+            with tempfile.NamedTemporaryFile(delete=False, suffix=".pdf") as tmp_file:
+                tmp_file.write(uploaded_file.getvalue())
+                tmp_file_path = tmp_file.name
+            # Use the temporary file path with PyPDFLoader
+            loader = PyPDFLoader(tmp_file_path)
             documents = loader.load()
+            # Remove the temporary file
+            os.unlink(tmp_file_path)
             # Split the document into chunks
             text_splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=50)
             chunks = text_splitter.split_documents(documents)