Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -28,7 +28,7 @@ class DocumentRetrievalAndGeneration:
|
|
28 |
def load_documents(self, folder_path):
|
29 |
loader = DirectoryLoader(folder_path, loader_cls=TextLoader)
|
30 |
documents = loader.load()
|
31 |
- text_splitter = RecursiveCharacterTextSplitter(chunk_size=…
|
32 |
all_splits = text_splitter.split_documents(documents)
|
33 |
print('Length of documents:', len(documents))
|
34 |
print("LEN of all_splits", len(all_splits))
|
@@ -52,7 +52,7 @@ class DocumentRetrievalAndGeneration:
|
|
52 |
def create_faiss_index(self):
|
53 |
all_texts = [split.page_content for split in self.all_splits]
|
54 |
|
55 |
- batch_size = …
|
56 |
all_embeddings = []
|
57 |
|
58 |
for i in range(0, len(all_texts), batch_size):
|
|
|
28 |
def load_documents(self, folder_path):
|
29 |
loader = DirectoryLoader(folder_path, loader_cls=TextLoader)
|
30 |
documents = loader.load()
|
31 |
+ text_splitter = RecursiveCharacterTextSplitter(chunk_size=5000, chunk_overlap=250)
|
32 |
all_splits = text_splitter.split_documents(documents)
|
33 |
print('Length of documents:', len(documents))
|
34 |
print("LEN of all_splits", len(all_splits))
|
|
|
52 |
def create_faiss_index(self):
|
53 |
all_texts = [split.page_content for split in self.all_splits]
|
54 |
|
55 |
+ batch_size = 256
|
56 |
all_embeddings = []
|
57 |
|
58 |
for i in range(0, len(all_texts), batch_size):
|