Spaces:
Runtime error
Runtime error
Commit
·
6e8fb2b
1
Parent(s):
23d5a88
Update app.py
Browse files
app.py
CHANGED
@@ -99,7 +99,7 @@ class SemanticSearch:
|
|
99 |
# return 'Corpus Loaded.'
|
100 |
|
101 |
# The modified function generates embeddings based on PDF file name and page number and checks if the embeddings file exists before loading or generating it.
|
102 |
-
def load_recommender(path, start_page=1):
|
103 |
global recommender
|
104 |
pdf_file = os.path.basename(path)
|
105 |
embeddings_file = f"{pdf_file}_{start_page}.npy"
|
@@ -110,7 +110,7 @@ def load_recommender(path, start_page=1):
|
|
110 |
recommender.fitted = True
|
111 |
return "Embeddings loaded from file"
|
112 |
|
113 |
-
texts = pdf_to_text(path, start_page=start_page)
|
114 |
chunks = text_to_chunks(texts, start_page=start_page)
|
115 |
recommender.fit(chunks)
|
116 |
np.save(embeddings_file, recommender.embeddings)
|
|
|
99 |
# return 'Corpus Loaded.'
|
100 |
|
101 |
# The modified function generates embeddings based on PDF file name and page number and checks if the embeddings file exists before loading or generating it.
|
102 |
+
def load_recommender(path, start_page=1, end_page=None):
|
103 |
global recommender
|
104 |
pdf_file = os.path.basename(path)
|
105 |
embeddings_file = f"{pdf_file}_{start_page}.npy"
|
|
|
110 |
recommender.fitted = True
|
111 |
return "Embeddings loaded from file"
|
112 |
|
113 |
+
texts = pdf_to_text(path, start_page=start_page, end_page=end_page)
|
114 |
chunks = text_to_chunks(texts, start_page=start_page)
|
115 |
recommender.fit(chunks)
|
116 |
np.save(embeddings_file, recommender.embeddings)
|