using data.dir for datasets
Browse files
app.py
CHANGED
@@ -5,6 +5,7 @@ import faiss
|
|
5 |
import numpy as np
|
6 |
import os
|
7 |
import time
|
|
|
8 |
|
9 |
# ✅ Ensure FAISS is installed
|
10 |
os.system("pip install faiss-cpu")
|
@@ -12,15 +13,32 @@ os.system("pip install faiss-cpu")
|
|
12 |
def log(message):
    """Print *message* to stdout, prefixed with a check-mark status marker.

    Args:
        message: Text to print after the marker.
    """
    # The marker and the message belong on one line; the scraped copy had
    # the literal split in two, which left the f-string unterminated.
    print(f"✅ {message}")
|
14 |
|
15 |
-
|
16 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
17 |
datasets = {
|
18 |
-
"sales":
|
19 |
-
"blended":
|
20 |
-
"dialog":
|
21 |
-
"multiwoz":
|
22 |
}
|
23 |
-
|
|
|
|
|
24 |
|
25 |
# ✅ Step 1: Run Embedding Script (Import and Run)
|
26 |
log("π Running embeddings script...")
|
|
|
5 |
import numpy as np
|
6 |
import os
|
7 |
import time
|
8 |
+
import json
|
9 |
|
10 |
# ✅ Ensure FAISS is installed
|
11 |
os.system("pip install faiss-cpu")
|
|
|
13 |
def log(message):
    """Print *message* to stdout, prefixed with a check-mark status marker.

    Args:
        message: Text to print after the marker.
    """
    # The marker and the message belong on one line; the scraped copy had
    # the literal split in two, which left the f-string unterminated.
    print(f"✅ {message}")
|
15 |
|
16 |
+
|
17 |
+
# Directory (relative to the working directory) that holds the dataset files.
DATA_DIR = "data"


def load_local_dataset(dataset_name):
    """Load a dataset from the JSON file ``<DATA_DIR>/<dataset_name>.json``.

    Args:
        dataset_name: Base name of the dataset file, without the ``.json``
            extension.

    Returns:
        The object decoded by ``json.load``, or ``None`` when the file does
        not exist (an error line is printed in that case).

    Raises:
        json.JSONDecodeError: If the file exists but is not valid JSON.
    """
    file_path = os.path.join(DATA_DIR, f"{dataset_name}.json")

    # Open directly instead of checking os.path.exists() first: a single
    # operation, no window between the check and the open.
    try:
        # JSON text is UTF-8; do not depend on the platform's locale encoding.
        with open(file_path, "r", encoding="utf-8") as f:
            data = json.load(f)
    except FileNotFoundError:
        print(f"❌ ERROR: {dataset_name} file not found!")
        return None

    print(f"✅ Loaded {dataset_name} from {file_path}")
    return data
|
31 |
+
|
32 |
+
# ✅ Load all datasets from local storage
|
33 |
# Each value is whatever load_local_dataset() returns for that name:
# the decoded JSON content, or None when the file is missing.
datasets = {
    "sales": load_local_dataset("sales"),
    "blended": load_local_dataset("blended"),
    "dialog": load_local_dataset("dialog"),
    "multiwoz": load_local_dataset("multiwoz"),
}

# NOTE(review): this line is printed unconditionally, even when one or more
# entries above are None because their file was not found.
print("✅ Datasets loaded from local storage!")
|
41 |
+
|
42 |
|
43 |
# ✅ Step 1: Run Embedding Script (Import and Run)
|
44 |
log("π Running embeddings script...")
|