Monimoy committed on
Commit
7cd74fe
·
verified ·
1 Parent(s): 474f9e8

Upload app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -24,8 +24,8 @@ peft_model_path = "./phi2-openassistant-lora-final"
24
  #bnb_4bit_use_double_quant=True,
25
  #)
26
  #base_model = AutoModelForCausalLM.from_pretrained(base_model_name, quantization_config=bnb_config, device_map={"": device})
27
- base_model = AutoModelForCausalLM.from_pretrained(base_model_name, model_type="llama", device_map={"": device}, quantization="4bit")
28
-
29
 
30
 
31
 
 
24
  #bnb_4bit_use_double_quant=True,
25
  #)
26
  #base_model = AutoModelForCausalLM.from_pretrained(base_model_name, quantization_config=bnb_config, device_map={"": device})
27
+ #base_model = AutoModelForCausalLM.from_pretrained(base_model_name, model_type="llama", device_map={"": device}, quantization="4bit")
28
+ base_model = AutoModelForCausalLM.from_pretrained(base_model_name, load_in_4bit=True, device_map={"": device}, torch_dtype=torch.float16)
29
 
30
 
31