optimize
Browse files
starvector/serve/conversation.py
CHANGED
@@ -124,7 +124,7 @@ class Conversation:
|
|
124 |
try:
|
125 |
result = future.result(timeout=0.1) # Specify the timeout duration in seconds
|
126 |
except concurrent.futures.TimeoutError:
|
127 |
-
print("Timeout occurred!")
|
128 |
result = None
|
129 |
return result
|
130 |
|
|
|
124 |
try:
|
125 |
result = future.result(timeout=0.1) # Specify the timeout duration in seconds
|
126 |
except concurrent.futures.TimeoutError:
|
127 |
+
# print("Timeout occurred!")
|
128 |
result = None
|
129 |
return result
|
130 |
|
starvector/serve/vllm_api_gradio/gradio_web_server.py
CHANGED
@@ -576,7 +576,7 @@ def build_demo(embed_mode):
|
|
576 |
temperature = gr.Slider(minimum=0.0, maximum=2.0, value=0.2, step=0.05, interactive=True, label="Temperature",)
|
577 |
len_penalty = gr.Slider(minimum=0.0, maximum=2.0, value=1.0, step=0.05, interactive=True, label="Length Penalty",)
|
578 |
top_p = gr.Slider(minimum=0.0, maximum=1.0, value=0.95, step=0.05, interactive=True, label="Top P",)
|
579 |
-
max_output_tokens = gr.Slider(minimum=0, maximum=
|
580 |
|
581 |
with gr.Column(scale=9):
|
582 |
with gr.Row():
|
|
|
576 |
temperature = gr.Slider(minimum=0.0, maximum=2.0, value=0.2, step=0.05, interactive=True, label="Temperature",)
|
577 |
len_penalty = gr.Slider(minimum=0.0, maximum=2.0, value=1.0, step=0.05, interactive=True, label="Length Penalty",)
|
578 |
top_p = gr.Slider(minimum=0.0, maximum=1.0, value=0.95, step=0.05, interactive=True, label="Top P",)
|
579 |
+
max_output_tokens = gr.Slider(minimum=0, maximum=1024, value=1024, step=64, interactive=True, label="Max output tokens",)
|
580 |
|
581 |
with gr.Column(scale=9):
|
582 |
with gr.Row():
|