Spaces:
Running
on
Zero
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
@@ -66,6 +66,8 @@ def stream_chat(
|
|
66 |
])
|
67 |
|
68 |
conversation.append({"role": "user", "content": message})
|
|
|
|
|
69 |
|
70 |
input_text = tokenizer.apply_chat_template(conversation, tokenize=False, add_generation_prompt=True)
|
71 |
inputs = tokenizer.encode(input_text, return_tensors="pt").to(device)
|
@@ -110,7 +112,7 @@ with gr.Blocks(theme="JohnSmith9982/small_and_pretty") as demo:
|
|
110 |
additional_inputs_accordion=gr.Accordion(label="⚙️ Parameters", open=False, render=False),
|
111 |
additional_inputs=[
|
112 |
gr.Slider(minimum=0, maximum=1, step=0.1, value=0.3, label="Temperature", render=False),
|
113 |
-
gr.Slider(minimum=128, maximum=32768, step=1, value=
|
114 |
gr.Slider(minimum=0.0, maximum=1.0, step=0.1, value=1.0, label="top_p", render=False),
|
115 |
gr.Slider(minimum=1, maximum=20, step=1, value=20, label="top_k", render=False),
|
116 |
gr.Slider(minimum=0.0, maximum=2.0, step=0.1, value=1.2, label="Repetition penalty", render=False),
|
|
|
66 |
])
|
67 |
|
68 |
conversation.append({"role": "user", "content": message})
|
69 |
+
|
70 |
+
print(message)
|
71 |
|
72 |
input_text = tokenizer.apply_chat_template(conversation, tokenize=False, add_generation_prompt=True)
|
73 |
inputs = tokenizer.encode(input_text, return_tensors="pt").to(device)
|
|
|
112 |
additional_inputs_accordion=gr.Accordion(label="⚙️ Parameters", open=False, render=False),
|
113 |
additional_inputs=[
|
114 |
gr.Slider(minimum=0, maximum=1, step=0.1, value=0.3, label="Temperature", render=False),
|
115 |
+
gr.Slider(minimum=128, maximum=32768, step=1, value=4096, label="Max new tokens", render=False),
|
116 |
gr.Slider(minimum=0.0, maximum=1.0, step=0.1, value=1.0, label="top_p", render=False),
|
117 |
gr.Slider(minimum=1, maximum=20, step=1, value=20, label="top_k", render=False),
|
118 |
gr.Slider(minimum=0.0, maximum=2.0, step=0.1, value=1.2, label="Repetition penalty", render=False),
|