Spaces:
Running
Running
optimize
Browse files
starvector/serve/conversation.py
CHANGED
|
@@ -124,7 +124,7 @@ class Conversation:
|
|
| 124 |
try:
|
| 125 |
result = future.result(timeout=0.1) # Specify the timeout duration in seconds
|
| 126 |
except concurrent.futures.TimeoutError:
|
| 127 |
-
print("Timeout occurred!")
|
| 128 |
result = None
|
| 129 |
return result
|
| 130 |
|
|
|
|
| 124 |
try:
|
| 125 |
result = future.result(timeout=0.1) # Specify the timeout duration in seconds
|
| 126 |
except concurrent.futures.TimeoutError:
|
| 127 |
+
# print("Timeout occurred!")
|
| 128 |
result = None
|
| 129 |
return result
|
| 130 |
|
starvector/serve/vllm_api_gradio/gradio_web_server.py
CHANGED
|
@@ -576,7 +576,7 @@ def build_demo(embed_mode):
|
|
| 576 |
temperature = gr.Slider(minimum=0.0, maximum=2.0, value=0.2, step=0.05, interactive=True, label="Temperature",)
|
| 577 |
len_penalty = gr.Slider(minimum=0.0, maximum=2.0, value=1.0, step=0.05, interactive=True, label="Length Penalty",)
|
| 578 |
top_p = gr.Slider(minimum=0.0, maximum=1.0, value=0.95, step=0.05, interactive=True, label="Top P",)
|
| 579 |
-
max_output_tokens = gr.Slider(minimum=0, maximum=
|
| 580 |
|
| 581 |
with gr.Column(scale=9):
|
| 582 |
with gr.Row():
|
|
|
|
| 576 |
temperature = gr.Slider(minimum=0.0, maximum=2.0, value=0.2, step=0.05, interactive=True, label="Temperature",)
|
| 577 |
len_penalty = gr.Slider(minimum=0.0, maximum=2.0, value=1.0, step=0.05, interactive=True, label="Length Penalty",)
|
| 578 |
top_p = gr.Slider(minimum=0.0, maximum=1.0, value=0.95, step=0.05, interactive=True, label="Top P",)
|
| 579 |
+
max_output_tokens = gr.Slider(minimum=0, maximum=1024, value=1024, step=64, interactive=True, label="Max output tokens",)
|
| 580 |
|
| 581 |
with gr.Column(scale=9):
|
| 582 |
with gr.Row():
|