arjunanand13 committed on
Commit
9adf9a9
·
verified ·
1 Parent(s): 29c5a5c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -28,7 +28,7 @@ class DocumentRetrievalAndGeneration:
28
  def load_documents(self, folder_path):
29
  loader = DirectoryLoader(folder_path, loader_cls=TextLoader)
30
  documents = loader.load()
31
- text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=125)
32
  all_splits = text_splitter.split_documents(documents)
33
  print('Length of documents:', len(documents))
34
  print("LEN of all_splits", len(all_splits))
@@ -52,7 +52,7 @@ class DocumentRetrievalAndGeneration:
52
  def create_faiss_index(self):
53
  all_texts = [split.page_content for split in self.all_splits]
54
 
55
- batch_size = 1024
56
  all_embeddings = []
57
 
58
  for i in range(0, len(all_texts), batch_size):
 
28
  def load_documents(self, folder_path):
29
  loader = DirectoryLoader(folder_path, loader_cls=TextLoader)
30
  documents = loader.load()
31
+ text_splitter = RecursiveCharacterTextSplitter(chunk_size=5000, chunk_overlap=250)
32
  all_splits = text_splitter.split_documents(documents)
33
  print('Length of documents:', len(documents))
34
  print("LEN of all_splits", len(all_splits))
 
52
  def create_faiss_index(self):
53
  all_texts = [split.page_content for split in self.all_splits]
54
 
55
+ batch_size = 256
56
  all_embeddings = []
57
 
58
  for i in range(0, len(all_texts), batch_size):