Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -49,15 +49,12 @@ def load_models():
|
|
| 49 |
model_name = "deepseek-ai/DeepSeek-R1-Distill-Llama-8B"
|
| 50 |
app.state.deepseek_tokenizer = AutoTokenizer.from_pretrained(model_name)
|
| 51 |
app.state.deepseek_tokenizer.pad_token = app.state.deepseek_tokenizer.eos_token
|
| 52 |
-
|
| 53 |
app.state.deepseek_model = AutoModelForCausalLM.from_pretrained(
|
| 54 |
model_name,
|
| 55 |
-
|
| 56 |
-
device_map="auto",
|
| 57 |
-
offload_folder="offload" # folder to store offloaded weights
|
| 58 |
)
|
| 59 |
|
| 60 |
-
|
| 61 |
# -----------------------------
|
| 62 |
# Model handlers
|
| 63 |
# -----------------------------
|
|
|
|
| 49 |
model_name = "deepseek-ai/DeepSeek-R1-Distill-Llama-8B"
|
| 50 |
app.state.deepseek_tokenizer = AutoTokenizer.from_pretrained(model_name)
|
| 51 |
app.state.deepseek_tokenizer.pad_token = app.state.deepseek_tokenizer.eos_token
|
| 52 |
+
|
| 53 |
app.state.deepseek_model = AutoModelForCausalLM.from_pretrained(
|
| 54 |
model_name,
|
| 55 |
+
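load_in_8bit=True, # requires bitsandbytes. NOTE(review): device_map="auto" was previously passed as an argument but now sits inside this comment, so it is not passed - confirm intent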
|
|
|
|
|
|
|
| 56 |
)
|
| 57 |
|
|
|
|
| 58 |
# -----------------------------
|
| 59 |
# Model handlers
|
| 60 |
# -----------------------------
|