Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -61,9 +61,12 @@ def load_models():
|
|
| 61 |
|
| 62 |
base_mod = AutoModelForCausalLM.from_pretrained(
|
| 63 |
BASE_ID,
|
| 64 |
-
|
| 65 |
-
|
|
|
|
|
|
|
| 66 |
)
|
|
|
|
| 67 |
norm_tok = AutoTokenizer.from_pretrained(ADAPTER_ID, use_fast=True, token=HF_TOKEN)
|
| 68 |
norm_mod = PeftModel.from_pretrained(
|
| 69 |
base_mod,
|
|
|
|
| 61 |
|
| 62 |
base_mod = AutoModelForCausalLM.from_pretrained(
|
| 63 |
BASE_ID,
|
| 64 |
+
token=HF_TOKEN,
|
| 65 |
+
device_map="auto", # deja que Accelerate decida
|
| 66 |
+
quantization_config=quant_config,
|
| 67 |
+
offload_folder="/tmp/offload" # ruta temporal de escritura
|
| 68 |
)
|
| 69 |
+
)
|
| 70 |
norm_tok = AutoTokenizer.from_pretrained(ADAPTER_ID, use_fast=True, token=HF_TOKEN)
|
| 71 |
norm_mod = PeftModel.from_pretrained(
|
| 72 |
base_mod,
|