Rhulli committed on
Commit
d349d34
·
verified ·
1 Parent(s): a05979c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -2
app.py CHANGED
@@ -61,9 +61,12 @@ def load_models():
61
 
62
  base_mod = AutoModelForCausalLM.from_pretrained(
63
  BASE_ID,
64
- device_map="auto",
65
- token=HF_TOKEN
 
 
66
  )
 
67
  norm_tok = AutoTokenizer.from_pretrained(ADAPTER_ID, use_fast=True, token=HF_TOKEN)
68
  norm_mod = PeftModel.from_pretrained(
69
  base_mod,
 
61
 
62
  base_mod = AutoModelForCausalLM.from_pretrained(
63
  BASE_ID,
64
+ token=HF_TOKEN,
65
+ device_map="auto", # deja que Accelerate decida
66
+ quantization_config=quant_config,
67
+ offload_folder="/tmp/offload" # ruta temporal de escritura
68
  )
69
+ )
70
  norm_tok = AutoTokenizer.from_pretrained(ADAPTER_ID, use_fast=True, token=HF_TOKEN)
71
  norm_mod = PeftModel.from_pretrained(
72
  base_mod,