Spaces:
Sleeping
Sleeping
Update rag.py
Browse files
rag.py
CHANGED
@@ -10,6 +10,14 @@ from langchain.vectorstores.utils import filter_complex_metadata
|
|
10 |
#add new import
|
11 |
from langchain_community.document_loaders.csv_loader import CSVLoader
|
12 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
13 |
|
14 |
|
15 |
class ChatPDF:
|
@@ -38,7 +46,7 @@ class ChatPDF:
|
|
38 |
chunks = self.text_splitter.split_documents(docs)
|
39 |
chunks = filter_complex_metadata(chunks)
|
40 |
|
41 |
-
vector_store = Chroma.from_documents(documents=chunks, embedding=
|
42 |
self.retriever = vector_store.as_retriever(
|
43 |
search_type="similarity_score_threshold",
|
44 |
search_kwargs={
|
|
|
10 |
#add new import
|
11 |
from langchain_community.document_loaders.csv_loader import CSVLoader
|
12 |
|
13 |
+
from sentence_transformers import SentenceTransformer
|
14 |
+
|
15 |
+
from langchain_community.embeddings import HuggingFaceEmbeddings
|
16 |
+
model_name = "sentence-transformers/all-mpnet-base-v2"
|
17 |
+
embedding = HuggingFaceEmbeddings(
|
18 |
+
model_name=model_name,
|
19 |
+
)
|
20 |
+
|
21 |
|
22 |
|
23 |
class ChatPDF:
|
|
|
46 |
chunks = self.text_splitter.split_documents(docs)
|
47 |
chunks = filter_complex_metadata(chunks)
|
48 |
|
49 |
+
vector_store = Chroma.from_documents(documents=chunks, embedding=embedding)
|
50 |
self.retriever = vector_store.as_retriever(
|
51 |
search_type="similarity_score_threshold",
|
52 |
search_kwargs={
|