Aleksandr Maiorov committed on
Commit
260686e
·
1 Parent(s): 11122fa

v0.6.2 - просто апи для генерации текста

Browse files
Files changed (1) hide show
  1. app.py +2 -3
app.py CHANGED
@@ -42,10 +42,9 @@ try:
42
  LLM = Llama.from_pretrained(
43
  repo_id=REPO_ID,
44
  filename='Vikhr-Qwen-2.5-1.5b-Instruct-Q8_0.gguf',
45
- n_threads=2,
46
- n_batch=512,
47
  n_gpu_layers=-1,
48
- n_ctx=4096,
49
  temperature=0.3,
50
  num_return_sequences=1,
51
  no_repeat_ngram_size=2,
 
42
  LLM = Llama.from_pretrained(
43
  repo_id=REPO_ID,
44
  filename='Vikhr-Qwen-2.5-1.5b-Instruct-Q8_0.gguf',
45
+ n_threads=4,
 
46
  n_gpu_layers=-1,
47
+ n_ctx=1512,
48
  temperature=0.3,
49
  num_return_sequences=1,
50
  no_repeat_ngram_size=2,