Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
|
@@ -20,13 +20,13 @@ LICENSE = """
|
|
| 20 |
<p/>
|
| 21 |
---
|
| 22 |
Chat with Buzz-small!
|
| 23 |
-
only 3b, this demo runs on the
|
| 24 |
"""
|
| 25 |
|
| 26 |
device = 0 if torch.cuda.is_available() else -1
|
| 27 |
|
| 28 |
model_id = "H-D-T/Buzz-3b-small-v0.6.3"
|
| 29 |
-
chatbot = pipeline(model=model_id, device=device, task="
|
| 30 |
|
| 31 |
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
| 32 |
bos_token = "<|begin_of_text|>"
|
|
|
|
| 20 |
<p/>
|
| 21 |
---
|
| 22 |
Chat with Buzz-small!
|
| 23 |
+
only 3b, this demo runs on the fp8 weights of the model in pytorch format, its brains are probably significantly damaged, converting to cpp soon, dont worry!
|
| 24 |
"""
|
| 25 |
|
| 26 |
device = 0 if torch.cuda.is_available() else -1
|
| 27 |
|
| 28 |
model_id = "H-D-T/Buzz-3b-small-v0.6.3"
|
| 29 |
+
# Build the chat pipeline with 8-bit quantized weights. The task id must be a
# name known to the transformers pipeline registry: "conversational" (the
# previous value "conversationa" was a typo and is rejected as an unknown task).
# NOTE(review): load_in_8bit presumably needs bitsandbytes and a CUDA device --
# confirm behavior when `device` is -1 (CPU), and whether passing `device`
# together with a quantized model is accepted by the installed version.
# NOTE(review): the "conversational" task appears to have been removed in newer
# transformers releases -- confirm the pinned version still provides it.
chatbot = pipeline(
    model=model_id,
    device=device,
    task="conversational",
    model_kwargs={"load_in_8bit": True},
)
|
| 30 |
|
| 31 |
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
| 32 |
bos_token = "<|begin_of_text|>"
|