ccm committed on
Commit
3f9aea7
·
verified ·
1 Parent(s): 1157109

Update main.py

Browse files
Files changed (1) hide show
  1. main.py +2 -1
main.py CHANGED
@@ -30,7 +30,8 @@ EMBEDDING_MODEL_NAME = "allenai-specter"
30
  LLM_MODEL_NAME = "Qwen/Qwen2-7B-Instruct"
31
 
32
  # Load the dataset and convert to pandas
33
- data = datasets.load_dataset("ccm/publications")["train"].to_pandas()
 
34
 
35
  # Filter out any publications without an abstract
36
  abstract_is_null = [
 
30
  LLM_MODEL_NAME = "Qwen/Qwen2-7B-Instruct"
31
 
32
  # Load the dataset and convert to pandas
33
+ # data = datasets.load_dataset("ccm/publications")["train"].to_pandas()
34
+ data = pandas.read_parquet("hf://datasets/ccm/publications/data/train-00000-of-00001.parquet")
35
 
36
  # Filter out any publications without an abstract
37
  abstract_is_null = [