pabloce committed on
Commit
ac67876
·
verified ·
1 Parent(s): c6c615b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -1
app.py CHANGED
@@ -48,7 +48,11 @@ def respond(
48
  settings.temperature = temperature
49
  settings.top_p = top_p
50
 
51
- return agent.get_chat_response(message, llm_sampling_settings=settings, returns_streaming_generator=True)
 
 
 
 
52
  # stop_tokens = ["</s>", "[INST]", "[INST] ", "<s>", "[/INST]", "[/INST] "]
53
  # chat_template = '<s>[INST] ' + system_message
54
  # # for human, assistant in history:
 
48
  settings.temperature = temperature
49
  settings.top_p = top_p
50
 
51
+ for new_token in agent.get_chat_response(message, llm_sampling_settings=settings, returns_streaming_generator=True):
52
+ partial_message += new_token
53
+ if '<|im_end|>' in partial_message:
54
+ break
55
+ yield partial_message
56
  # stop_tokens = ["</s>", "[INST]", "[INST] ", "<s>", "[/INST]", "[/INST] "]
57
  # chat_template = '<s>[INST] ' + system_message
58
  # # for human, assistant in history: