Update app.py
app.py CHANGED
@@ -1,5 +1,4 @@
 import streamlit as st
-import pandas as pd
 from llama_index.core import StorageContext, load_index_from_storage, VectorStoreIndex, SimpleDirectoryReader, ChatPromptTemplate
 from llama_index.llms.huggingface import HuggingFaceInferenceAPI
 from llama_index.embeddings.huggingface import HuggingFaceEmbedding
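HuggingFaceEmbedding is imported above but configured outside the hunks shown in this diff. In current llama_index releases the embedding model is usually registered globally through Settings; a minimal sketch, with an illustrative model name that is not taken from this Space:

    from llama_index.core import Settings
    from llama_index.embeddings.huggingface import HuggingFaceEmbedding

    # Illustrative model name; the Space's actual embedding model is not visible in this diff.
    Settings.embed_model = HuggingFaceEmbedding(model_name="BAAI/bge-small-en-v1.5")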
@@ -32,20 +31,7 @@ os.makedirs(DATA_DIR, exist_ok=True)
 os.makedirs(PERSIST_DIR, exist_ok=True)

 def data_ingestion():
-    documents = []
-
-    # Load documents from the data directory
-    documents += SimpleDirectoryReader(DATA_DIR).load_data()
-
-    # Process and load CSV files
-    for file in os.listdir(DATA_DIR):
-        if file.endswith(".csv"):
-            csv_path = os.path.join(DATA_DIR, file)
-            df = pd.read_csv(csv_path)
-            # Convert DataFrame to a list of text strings (or any other format suitable for your embeddings)
-            csv_texts = df.apply(lambda row: " ".join(row.astype(str)), axis=1).tolist()
-            documents += csv_texts
-
+    documents = SimpleDirectoryReader(DATA_DIR).load_data()
     storage_context = StorageContext.from_defaults()
     index = VectorStoreIndex.from_documents(documents)
     index.storage_context.persist(persist_dir=PERSIST_DIR)
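The removed CSV branch appended raw strings to documents, while VectorStoreIndex.from_documents expects Document objects, which raw strings do not satisfy. If CSV support were ever reinstated, one way to keep the rows compatible is to wrap each one in a Document; a minimal sketch, illustrative only and not part of this commit:

    import os
    import pandas as pd
    from llama_index.core import Document, SimpleDirectoryReader

    def load_documents(data_dir):
        # PDFs, text files, etc. via the standard reader
        documents = SimpleDirectoryReader(data_dir).load_data()
        for file in os.listdir(data_dir):
            if file.endswith(".csv"):
                df = pd.read_csv(os.path.join(data_dir, file))
                # Wrap each row in a Document so the index accepts it
                rows = df.apply(lambda row: " ".join(row.astype(str)), axis=1)
                documents += [Document(text=row) for row in rows]
        return documents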
@@ -111,7 +97,7 @@ for message in st.session_state.messages:

 with st.sidebar:
     st.title("Menu:")
-    uploaded_file = st.file_uploader("Upload your PDF
+    uploaded_file = st.file_uploader("Upload your PDF Files and Click on the Submit & Process Button")
     video_url = st.text_input("Enter Youtube Video Link: ")
     if st.button("Submit & Process"):
         with st.spinner("Processing..."):
@@ -119,7 +105,7 @@ with st.sidebar:
             remove_old_files()

             if uploaded_file:
-                filepath =
+                filepath = "data/saved_pdf.pdf"
                 with open(filepath, "wb") as f:
                     f.write(uploaded_file.getbuffer())

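Each upload now overwrites the fixed path data/saved_pdf.pdf. If the original filename ever needed to be preserved, Streamlit's UploadedFile exposes it as .name; an illustrative variation, assuming DATA_DIR is the same "data" directory used elsewhere in app.py:

    import os

    if uploaded_file:
        # Keep the user's filename instead of a fixed one (illustrative alternative)
        filepath = os.path.join(DATA_DIR, uploaded_file.name)
        with open(filepath, "wb") as f:
            f.write(uploaded_file.getbuffer())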
@@ -128,10 +114,10 @@ with st.sidebar:
                 with open("data/saved_text.txt", "w") as file:
                     file.write(extracted_text)

-            data_ingestion()  # Process every time new file is uploaded
+            data_ingestion()  # Process PDF every time new file is uploaded
             st.success("Done")

-user_prompt = st.chat_input("Ask me anything about the content of the PDF
+user_prompt = st.chat_input("Ask me anything about the content of the PDF:")

 if user_prompt and (uploaded_file or video_url):
     st.session_state.messages.append({'role': 'user', "content": user_prompt})
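How user_prompt is answered is outside the hunks shown. A typical LlamaIndex flow for this setup would reload the index that data_ingestion() persisted and query it with the imported HuggingFaceInferenceAPI; the sketch below is an assumption about that flow, with a hypothetical helper name, model name, and token handling:

    import os
    from llama_index.core import StorageContext, load_index_from_storage
    from llama_index.llms.huggingface import HuggingFaceInferenceAPI

    def handle_query(question, persist_dir):
        # Reload the index persisted by data_ingestion(); assumes Settings.embed_model
        # is configured as sketched above.
        storage_context = StorageContext.from_defaults(persist_dir=persist_dir)
        index = load_index_from_storage(storage_context)
        # Illustrative model and token source; the Space's real LLM setup is not shown.
        llm = HuggingFaceInferenceAPI(
            model_name="HuggingFaceH4/zephyr-7b-beta",
            token=os.getenv("HF_TOKEN"),
        )
        query_engine = index.as_query_engine(llm=llm)
        return str(query_engine.query(question))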