Tijmen2 committed on
Commit
086415c
·
verified ·
1 Parent(s): 773f3db

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -0
app.py CHANGED
@@ -14,6 +14,7 @@ llm = Llama(
14
  n_ctx=2048,
15
  chat_format="llama-3",
16
  n_gpu_layers=-1, # ensure all layers are on GPU
 
17
  )
18
 
19
  # Placeholder responses for when context is empty
 
14
  n_ctx=2048,
15
  chat_format="llama-3",
16
  n_gpu_layers=-1, # ensure all layers are on GPU
17
+ n_threads=1, # no CPU multi-threading
18
  )
19
 
20
  # Placeholder responses for when context is empty