dh-mc committed on
Commit
1071606
·
1 Parent(s): fc6b2b9

refine TGI params

Browse files
Files changed (1) hide show
  1. app_modules/llm_loader.py +3 -3
app_modules/llm_loader.py CHANGED
@@ -191,11 +191,11 @@ class LLMLoader:
191
  self.llm = HuggingFaceTextGenInference(
192
  inference_server_url=HFTGI_SERVER_URL,
193
  max_new_tokens=self.max_tokens_limit / 2,
194
- top_k=10,
195
  top_p=0.95,
196
- typical_p=0.95,
197
  temperature=0.01,
198
- repetition_penalty=1.03,
199
  callbacks=callbacks,
200
  streaming=True,
201
  )
 
191
  self.llm = HuggingFaceTextGenInference(
192
  inference_server_url=HFTGI_SERVER_URL,
193
  max_new_tokens=self.max_tokens_limit / 2,
194
+ # top_k=0,
195
  top_p=0.95,
196
+ # typical_p=0.95,
197
  temperature=0.01,
198
+ repetition_penalty=1.115,
199
  callbacks=callbacks,
200
  streaming=True,
201
  )