Update app.py
Browse files
app.py
CHANGED
@@ -50,7 +50,7 @@ def respond(
|
|
50 |
llm = Llama(
|
51 |
model_path=f"models/{model}",
|
52 |
flash_attn=True,
|
53 |
-
n_threads=
|
54 |
n_gpu_layers=81,
|
55 |
n_batch=1024,
|
56 |
n_ctx=8192,
|
|
|
50 |
llm = Llama(
|
51 |
model_path=f"models/{model}",
|
52 |
flash_attn=True,
|
53 |
+
n_threads=40,
|
54 |
n_gpu_layers=81,
|
55 |
n_batch=1024,
|
56 |
n_ctx=8192,
|