Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -12,7 +12,7 @@ llm = Llama(
|
|
12 |
filename="llama-2-7b-chat.ggmlv3.q5_0.bin",
|
13 |
),
|
14 |
n_ctx=2048,
|
15 |
-
n_gpu_layers=
|
16 |
)
|
17 |
|
18 |
history = []
|
@@ -61,6 +61,8 @@ demo = gr.ChatInterface(
|
|
61 |
generate_text,
|
62 |
title="llama-cpp-python on GPU",
|
63 |
description="Running LLM with https://github.com/abetlen/llama-cpp-python",
|
|
|
|
|
64 |
retry_btn=None,
|
65 |
undo_btn="Delete Previous",
|
66 |
clear_btn="Clear",
|
|
|
12 |
filename="llama-2-7b-chat.ggmlv3.q5_0.bin",
|
13 |
),
|
14 |
n_ctx=2048,
|
15 |
+
n_gpu_layers=5000, # change n_gpu_layers if you have more or less VRAM
|
16 |
)
|
17 |
|
18 |
history = []
|
|
|
61 |
generate_text,
|
62 |
title="llama-cpp-python on GPU",
|
63 |
description="Running LLM with https://github.com/abetlen/llama-cpp-python",
|
64 |
+
examples=["tell me everything about llamas"],
|
65 |
+
cache_examples=True,
|
66 |
retry_btn=None,
|
67 |
undo_btn="Delete Previous",
|
68 |
clear_btn="Clear",
|