Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -20,13 +20,13 @@ LICENSE = """
|
|
20 |
<p/>
|
21 |
---
|
22 |
Chat with Buzz-small!
|
23 |
-
only 3b, this demo runs on the
|
24 |
"""
|
25 |
|
26 |
device = 0 if torch.cuda.is_available() else -1
|
27 |
|
28 |
model_id = "H-D-T/Buzz-3b-small-v0.6.3"
|
29 |
-
chatbot = pipeline(model=model_id, device=device, task="
|
30 |
|
31 |
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
32 |
bos_token = "<|begin_of_text|>"
|
|
|
20 |
<p/>
|
21 |
---
|
22 |
Chat with Buzz-small!
|
23 |
+
Only 3B; this demo runs on the fp8 weights of the model in PyTorch format, so its brains are probably significantly damaged. Converting to cpp soon, don't worry!
|
24 |
"""
|
25 |
|
26 |
device = 0 if torch.cuda.is_available() else -1
|
27 |
|
28 |
model_id = "H-D-T/Buzz-3b-small-v0.6.3"
|
29 |
+
chatbot = pipeline(model=model_id, device=device, task="conversational", model_kwargs={"load_in_8bit": True})
|
30 |
|
31 |
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
32 |
bos_token = "<|begin_of_text|>"
|