Luigi commited on
Commit
4443d46
·
1 Parent(s): 4d633ef

adjust thread numbers

Browse files
Files changed (1) hide show
  1. app.py +4 -3
app.py CHANGED
@@ -13,9 +13,10 @@ hf_hub_download(
13
  def load_model():
14
  return Llama(
15
  model_path="models/qwen2.5-1.5b-instruct-q4_k_m.gguf",
16
- n_ctx=2048,
17
- n_threads=6,
18
- n_batch=8,
 
19
  n_gpu_layers=0,
20
  use_mlock=False,
21
  use_mmap=True,
 
13
  def load_model():
14
  return Llama(
15
  model_path="models/qwen2.5-1.5b-instruct-q4_k_m.gguf",
16
+ n_ctx=1024,
17
+ n_threads=2,
18
+ n_threads_batch=2,
19
+ n_batch=4,
20
  n_gpu_layers=0,
21
  use_mlock=False,
22
  use_mmap=True,