Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -9,13 +9,11 @@ from huggingface_hub import hf_hub_download # load from the Hugging Face Hub
|
|
9 |
|
10 |
llm = Llama(
|
11 |
model_path=hf_hub_download(
|
12 |
-
# repo_id="TheBloke/WizardLM-7B-uncensored-GGML",
|
13 |
repo_id="TheBloke/Llama-2-7B-Chat-GGML",
|
14 |
-
# filename="WizardLM-7B-uncensored.ggmlv3.q4_0.bin",
|
15 |
filename="llama-2-7b-chat.ggmlv3.q5_0.bin",
|
16 |
),
|
17 |
n_ctx=2048,
|
18 |
-
n_gpu_layers=
|
19 |
) # download model from the Hugging Face Hub; n_ctx=2048 for a longer context length
|
20 |
|
21 |
history = []
|
|
|
9 |
|
10 |
llm = Llama(
|
11 |
model_path=hf_hub_download(
|
|
|
12 |
repo_id="TheBloke/Llama-2-7B-Chat-GGML",
|
|
|
13 |
filename="llama-2-7b-chat.ggmlv3.q5_0.bin",
|
14 |
),
|
15 |
n_ctx=2048,
|
16 |
+
n_gpu_layers=500,
|
17 |
) # download model from the Hugging Face Hub; n_ctx=2048 for a longer context length
|
18 |
|
19 |
history = []
|