Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -72,8 +72,8 @@ def generate_response(user_message, history):
|
|
72 |
# top_k=50, # Top-k sampling for efficiency
|
73 |
# pad_token_id=veri_tokenizer.eos_token_id,
|
74 |
# eos_token_id=veri_tokenizer.eos_token_id,
|
75 |
-
|
76 |
-
|
77 |
# length_penalty=1.0,
|
78 |
# early_stopping=True, # Stop early when appropriate
|
79 |
# num_beams=1, # Greedy search for speed
|
|
|
72 |
# top_k=50, # Top-k sampling for efficiency
|
73 |
# pad_token_id=veri_tokenizer.eos_token_id,
|
74 |
# eos_token_id=veri_tokenizer.eos_token_id,
|
75 |
+
use_cache=True, # Enable KV caching for faster generation
|
76 |
+
repetition_penalty=1.1, # Reduce repetition
|
77 |
# length_penalty=1.0,
|
78 |
# early_stopping=True, # Stop early when appropriate
|
79 |
# num_beams=1, # Greedy search for speed
|