Jiangxz committed on
Commit
76a8f0a
·
verified ·
1 Parent(s): 8a7b2f1

Upload app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -2
app.py CHANGED
@@ -54,7 +54,15 @@ sources = [
54
  "TaxQADataSet_ntpc1.txt",
55
  "TaxQADataSet_ntpc2.txt",
56
  "TaxQADataSet_kctax.txt",
57
- "TaxQADataSet_chutax.txt"
 
 
 
 
 
 
 
 
58
  ]
59
 
60
  documents = load_documents(sources)
@@ -70,7 +78,7 @@ text_splitter = RecursiveCharacterTextSplitter(
70
  split_docs = text_splitter.split_documents(documents)
71
  print(f"分割後的文件數量:{len(split_docs)}")
72
 
73
- embeddings = HuggingFaceEmbeddings(model_name="BAAI/bge-m3")
74
  print(f"\n成功初始化嵌入模型")
75
 
76
  print(f"開始建立向量資料庫")
 
54
  "TaxQADataSet_ntpc1.txt",
55
  "TaxQADataSet_ntpc2.txt",
56
  "TaxQADataSet_kctax.txt",
57
+ "TaxQADataSet_chutax.txt",
58
+ "HouseTaxAct1130103.txt",
59
+ "VehicleLicenseTaxAct1101230.txt",
60
+ "TaxCollectionAct1101217.txt",
61
+ "LandTaxAct1100623.txt",
62
+ "AmusementTaxAct960523.txt",
63
+ "StampTaxAct910515.txt",
64
+ "DeedTaxAct990505.txt",
65
+ "ProgressiveHouseTaxRates1130701.txt"
66
  ]
67
 
68
  documents = load_documents(sources)
 
78
  split_docs = text_splitter.split_documents(documents)
79
  print(f"分割後的文件數量:{len(split_docs)}")
80
 
81
+ embeddings = HuggingFaceEmbeddings(model_name="BAAI/bge-large-zh-v1.5")
82
  print(f"\n成功初始化嵌入模型")
83
 
84
  print(f"開始建立向量資料庫")