hz2475 committed on
Commit
071dd9a
·
1 Parent(s): 4cf9521
starvector/serve/conversation.py CHANGED
@@ -124,7 +124,7 @@ class Conversation:
124
  try:
125
  result = future.result(timeout=0.1) # Specify the timeout duration in seconds
126
  except concurrent.futures.TimeoutError:
127
- print("Timeout occurred!")
128
  result = None
129
  return result
130
 
 
124
  try:
125
  result = future.result(timeout=0.1) # Specify the timeout duration in seconds
126
  except concurrent.futures.TimeoutError:
127
+ # print("Timeout occurred!")
128
  result = None
129
  return result
130
 
starvector/serve/vllm_api_gradio/gradio_web_server.py CHANGED
@@ -576,7 +576,7 @@ def build_demo(embed_mode):
576
  temperature = gr.Slider(minimum=0.0, maximum=2.0, value=0.2, step=0.05, interactive=True, label="Temperature",)
577
  len_penalty = gr.Slider(minimum=0.0, maximum=2.0, value=1.0, step=0.05, interactive=True, label="Length Penalty",)
578
  top_p = gr.Slider(minimum=0.0, maximum=1.0, value=0.95, step=0.05, interactive=True, label="Top P",)
579
- max_output_tokens = gr.Slider(minimum=0, maximum=8192, value=8192, step=64, interactive=True, label="Max output tokens",)
580
 
581
  with gr.Column(scale=9):
582
  with gr.Row():
 
576
  temperature = gr.Slider(minimum=0.0, maximum=2.0, value=0.2, step=0.05, interactive=True, label="Temperature",)
577
  len_penalty = gr.Slider(minimum=0.0, maximum=2.0, value=1.0, step=0.05, interactive=True, label="Length Penalty",)
578
  top_p = gr.Slider(minimum=0.0, maximum=1.0, value=0.95, step=0.05, interactive=True, label="Top P",)
579
+ max_output_tokens = gr.Slider(minimum=0, maximum=1024, value=1024, step=64, interactive=True, label="Max output tokens",)
580
 
581
  with gr.Column(scale=9):
582
  with gr.Row():