Spaces: Running on Zero
Update app.py
Browse files
app.py
CHANGED
@@ -141,7 +141,7 @@ def initialize_model():
|
|
141 |
model = AutoModelForCausalLM.from_pretrained(
|
142 |
MODEL_ID,
|
143 |
device_map="cuda",
|
144 |
-
quantization_config=quantization_config,
|
145 |
torch_dtype=torch.bfloat16,
|
146 |
trust_remote_code=True
|
147 |
).to("cuda")
|
@@ -213,7 +213,7 @@ with gr.Blocks(css=CSS, theme=gr.themes.Soft()) as demo:
|
|
213 |
|
214 |
with gr.Accordion("⚙️ Settings", open=False):
|
215 |
system_prompt = gr.TextArea(value=DEFAULT_SYSTEM_PROMPT, label="System Instructions")
|
216 |
-
temperature = gr.Slider(0, 1, value=0.
|
217 |
max_tokens = gr.Slider(128, 8192, value=2048, label="Max Response Length")
|
218 |
|
219 |
clear = gr.Button("Clear History")
|
|
|
141 |
model = AutoModelForCausalLM.from_pretrained(
|
142 |
MODEL_ID,
|
143 |
device_map="cuda",
|
144 |
+
#quantization_config=quantization_config,
|
145 |
torch_dtype=torch.bfloat16,
|
146 |
trust_remote_code=True
|
147 |
).to("cuda")
|
|
|
213 |
|
214 |
with gr.Accordion("⚙️ Settings", open=False):
|
215 |
system_prompt = gr.TextArea(value=DEFAULT_SYSTEM_PROMPT, label="System Instructions")
|
216 |
+
temperature = gr.Slider(0, 1, value=0.3, label="Creativity")
|
217 |
max_tokens = gr.Slider(128, 8192, value=2048, label="Max Response Length")
|
218 |
|
219 |
clear = gr.Button("Clear History")
|