bhaskartripathi committed on
Commit
6e8fb2b
·
1 Parent(s): 23d5a88

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -99,7 +99,7 @@ class SemanticSearch:
99
  # return 'Corpus Loaded.'
100
 
101
  # The modified function generates embeddings based on PDF file name and page number and checks if the embeddings file exists before loading or generating it.
102
- def load_recommender(path, start_page=1):
103
  global recommender
104
  pdf_file = os.path.basename(path)
105
  embeddings_file = f"{pdf_file}_{start_page}.npy"
@@ -110,7 +110,7 @@ def load_recommender(path, start_page=1):
110
  recommender.fitted = True
111
  return "Embeddings loaded from file"
112
 
113
- texts = pdf_to_text(path, start_page=start_page)
114
  chunks = text_to_chunks(texts, start_page=start_page)
115
  recommender.fit(chunks)
116
  np.save(embeddings_file, recommender.embeddings)
 
99
  # return 'Corpus Loaded.'
100
 
101
  # The modified function generates embeddings based on PDF file name and page number and checks if the embeddings file exists before loading or generating it.
102
+ def load_recommender(path, start_page=1, end_page=None):
103
  global recommender
104
  pdf_file = os.path.basename(path)
105
  embeddings_file = f"{pdf_file}_{start_page}.npy"
 
110
  recommender.fitted = True
111
  return "Embeddings loaded from file"
112
 
113
+ texts = pdf_to_text(path, start_page=start_page, end_page=end_page)
114
  chunks = text_to_chunks(texts, start_page=start_page)
115
  recommender.fit(chunks)
116
  np.save(embeddings_file, recommender.embeddings)