samim2024 committed on
Commit
85cdbf8
·
verified ·
1 Parent(s): 640cf86

Update rag.py

Browse files
Files changed (1) hide show
  1. rag.py +9 -1
rag.py CHANGED
@@ -10,6 +10,14 @@ from langchain.vectorstores.utils import filter_complex_metadata
10
  #add new import
11
  from langchain_community.document_loaders.csv_loader import CSVLoader
12
 
 
 
 
 
 
 
 
 
13
 
14
 
15
  class ChatPDF:
@@ -38,7 +46,7 @@ class ChatPDF:
38
  chunks = self.text_splitter.split_documents(docs)
39
  chunks = filter_complex_metadata(chunks)
40
 
41
- vector_store = Chroma.from_documents(documents=chunks, embedding=FastEmbedEmbeddings())
42
  self.retriever = vector_store.as_retriever(
43
  search_type="similarity_score_threshold",
44
  search_kwargs={
 
10
  #add new import
11
  from langchain_community.document_loaders.csv_loader import CSVLoader
12
 
13
+ from sentence_transformers import SentenceTransformer
14
+
15
+ from langchain_community.embeddings import HuggingFaceEmbeddings
16
+ model_name = "sentence-transformers/all-mpnet-base-v2"
17
+ embedding = HuggingFaceEmbeddings(
18
+ model_name=model_name,
19
+ )
20
+
21
 
22
 
23
  class ChatPDF:
 
46
  chunks = self.text_splitter.split_documents(docs)
47
  chunks = filter_complex_metadata(chunks)
48
 
49
+ vector_store = Chroma.from_documents(documents=chunks, embedding=embedding)
50
  self.retriever = vector_store.as_retriever(
51
  search_type="similarity_score_threshold",
52
  search_kwargs={