refine TGI params
Browse files
app_modules/llm_loader.py
CHANGED
@@ -191,11 +191,11 @@ class LLMLoader:
|
|
191 |
self.llm = HuggingFaceTextGenInference(
|
192 |
inference_server_url=HFTGI_SERVER_URL,
|
193 |
max_new_tokens=self.max_tokens_limit / 2,
|
194 |
-
top_k=
|
195 |
top_p=0.95,
|
196 |
-
typical_p=0.95,
|
197 |
temperature=0.01,
|
198 |
-
repetition_penalty=1.
|
199 |
callbacks=callbacks,
|
200 |
streaming=True,
|
201 |
)
|
|
|
191 |
self.llm = HuggingFaceTextGenInference(
|
192 |
inference_server_url=HFTGI_SERVER_URL,
|
193 |
max_new_tokens=self.max_tokens_limit / 2,
|
194 |
+
# top_k=0,
|
195 |
top_p=0.95,
|
196 |
+
# typical_p=0.95,
|
197 |
temperature=0.01,
|
198 |
+
repetition_penalty=1.115,
|
199 |
callbacks=callbacks,
|
200 |
streaming=True,
|
201 |
)
|