radames committed on
Commit
22938c3
·
1 Parent(s): d4e1d16

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -3
app.py CHANGED
@@ -9,11 +9,13 @@ from huggingface_hub import hf_hub_download # load from huggingfaces
9
 
10
  llm = Llama(
11
  model_path=hf_hub_download(
12
- repo_id="TheBloke/WizardLM-7B-uncensored-GGML",
13
- filename="WizardLM-7B-uncensored.ggmlv3.q4_0.bin",
 
 
14
  ),
15
  n_ctx=2048,
16
- n_gpu_layers=30
17
  ) # download model from hf/ n_ctx=2048 for high ccontext length
18
 
19
  history = []
 
9
 
10
  llm = Llama(
11
  model_path=hf_hub_download(
12
+ # repo_id="TheBloke/WizardLM-7B-uncensored-GGML",
13
+ repo_id="WizardLM-7B-uncensored-GGML",
14
+ # filename="WizardLM-7B-uncensored.ggmlv3.q4_0.bin",
15
+ filename="llama-2-7b-chat.ggmlv3.q5_0.bin",
16
  ),
17
  n_ctx=2048,
18
+ n_gpu_layers=50
19
  ) # download model from hf/ n_ctx=2048 for high ccontext length
20
 
21
  history = []