wakeupmh committed on
Commit
5f3cb01
·
1 Parent(s): f3bc435

fix: cuda error

Browse files
Files changed (2) hide show
  1. app.py +7 -2
  2. requirements.txt +2 -1
app.py CHANGED
@@ -18,8 +18,13 @@ DATASET_PATH = os.path.join(DATASET_DIR, "dataset")
18
  @st.cache_resource
19
  def load_models():
20
  model_name = "google/flan-t5-small" # Lighter model
21
- tokenizer = AutoTokenizer.from_pretrained(model_name, device_map="auto")
22
- model = AutoModelForSeq2SeqLM.from_pretrained(model_name, device_map="auto", load_in_8bit=True)
 
 
 
 
 
23
  return tokenizer, model
24
 
25
  @st.cache_data
 
18
  @st.cache_resource
19
  def load_models():
20
  model_name = "google/flan-t5-small" # Lighter model
21
+ tokenizer = AutoTokenizer.from_pretrained(model_name)
22
+ model = AutoModelForSeq2SeqLM.from_pretrained(
23
+ model_name,
24
+ device_map="auto",
25
+ load_in_8bit=True,
26
+ trust_remote_code=True
27
+ )
28
  return tokenizer, model
29
 
30
  @st.cache_data
requirements.txt CHANGED
@@ -4,6 +4,7 @@ datasets
4
  sentence-transformers
5
  faiss-cpu
6
  arxiv
7
- torch --index-url https://download.pytorch.org/whl/cpu
 
8
  accelerate>=0.26.0
9
  bitsandbytes>=0.41.1
 
4
  sentence-transformers
5
  faiss-cpu
6
  arxiv
7
+ --extra-index-url https://download.pytorch.org/whl/cpu
8
+ torch
9
  accelerate>=0.26.0
10
  bitsandbytes>=0.41.1