Spaces: Paused
Update llm.py
Browse files
llm.py
CHANGED
|
@@ -5,7 +5,7 @@ import torch
|
|
| 5 |
import asyncio
|
| 6 |
from functools import partial
|
| 7 |
import time
|
| 8 |
-
from transformers import AutoProcessor,
|
| 9 |
|
| 10 |
# Quantization config
|
| 11 |
# quant_config = BitsAndBytesConfig(load_in_8bit=True)
|
|
@@ -14,7 +14,7 @@ model_name="Qwen/Qwen3.5-9B-Base"
|
|
| 14 |
processor = AutoProcessor.from_pretrained(model_name)
|
| 15 |
|
| 16 |
# Load model (auto device mapping)
|
| 17 |
-
model =
|
| 18 |
model_name,
|
| 19 |
# quantization_config=quant_config,
|
| 20 |
device_map="auto",
|
|
|
|
| 5 |
import asyncio
|
| 6 |
from functools import partial
|
| 7 |
import time
|
| 8 |
+
from transformers import AutoProcessor, AutoModelForVision2Seq #, BitsAndBytesConfig
|
| 9 |
|
| 10 |
# Quantization config
|
| 11 |
# quant_config = BitsAndBytesConfig(load_in_8bit=True)
|
|
|
|
| 14 |
processor = AutoProcessor.from_pretrained(model_name)
|
| 15 |
|
| 16 |
# Load model (auto device mapping)
|
| 17 |
+
model = AutoModelForVision2Seq.from_pretrained(
|
| 18 |
model_name,
|
| 19 |
# quantization_config=quant_config,
|
| 20 |
device_map="auto",
|