Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -50,19 +50,20 @@ api_key = os.getenv("OPENAI_API_KEY")
|
|
50 |
|
51 |
|
52 |
|
53 |
-
# Updated
|
54 |
-
@st.cache_data(persist="disk")
|
55 |
def load_vector_store(file_path, store_name, force_reload=False):
|
56 |
-
|
|
|
57 |
|
58 |
# Check if vector store already exists and force_reload is False
|
59 |
if not force_reload and os.path.exists(vector_store_path):
|
60 |
with open(vector_store_path, "rb") as f:
|
61 |
VectorStore = pickle.load(f)
|
|
|
62 |
else:
|
63 |
# Load and process the PDF, then create the vector store
|
64 |
-
text_splitter = RecursiveCharacterTextSplitter(
|
65 |
-
chunk_size=1000, chunk_overlap=200, length_function=len)
|
66 |
text = load_pdf_text(file_path)
|
67 |
chunks = text_splitter.split_text(text=text)
|
68 |
embeddings = OpenAIEmbeddings()
|
@@ -71,11 +72,23 @@ def load_vector_store(file_path, store_name, force_reload=False):
|
|
71 |
# Serialize the vector store
|
72 |
with open(vector_store_path, "wb") as f:
|
73 |
pickle.dump(VectorStore, f)
|
|
|
74 |
|
75 |
-
#
|
76 |
-
|
77 |
-
|
78 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
79 |
|
80 |
return VectorStore
|
81 |
|
|
|
50 |
|
51 |
|
52 |
|
53 |
+
# Updated load_vector_store function with Streamlit text outputs and directory handling for Git
|
54 |
+
@st.cache_data(persist="disk")
|
55 |
def load_vector_store(file_path, store_name, force_reload=False):
|
56 |
+
local_repo_path = "Private_Book"
|
57 |
+
vector_store_path = os.path.join(local_repo_path, f"{store_name}.pkl")
|
58 |
|
59 |
# Check if vector store already exists and force_reload is False
|
60 |
if not force_reload and os.path.exists(vector_store_path):
|
61 |
with open(vector_store_path, "rb") as f:
|
62 |
VectorStore = pickle.load(f)
|
63 |
+
st.text(f"Loaded existing vector store from {vector_store_path}")
|
64 |
else:
|
65 |
# Load and process the PDF, then create the vector store
|
66 |
+
text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=200, length_function=len)
|
|
|
67 |
text = load_pdf_text(file_path)
|
68 |
chunks = text_splitter.split_text(text=text)
|
69 |
embeddings = OpenAIEmbeddings()
|
|
|
72 |
# Serialize the vector store
|
73 |
with open(vector_store_path, "wb") as f:
|
74 |
pickle.dump(VectorStore, f)
|
75 |
+
st.text(f"Created and saved vector store at {vector_store_path}")
|
76 |
|
77 |
+
# Change working directory for Git operations
|
78 |
+
original_dir = os.getcwd()
|
79 |
+
os.chdir(local_repo_path)
|
80 |
+
|
81 |
+
try:
|
82 |
+
# Commit and push changes to the repository
|
83 |
+
repo.git_add(vector_store_path) # Stage the file for commit
|
84 |
+
repo.git_commit(f"Update vector store: {store_name}") # Commit the file
|
85 |
+
repo.git_push() # Push the commit to the remote repository
|
86 |
+
st.text("Committed and pushed vector store to repository.")
|
87 |
+
except Exception as e:
|
88 |
+
st.error(f"Error during Git operations: {e}")
|
89 |
+
finally:
|
90 |
+
# Change back to the original directory
|
91 |
+
os.chdir(original_dir)
|
92 |
|
93 |
return VectorStore
|
94 |
|