Monimoy committed on
Commit
c7d8cf4
·
verified ·
1 Parent(s): 4c7bc10

Upload app.py

Browse files
Files changed (1) hide show
  1. app.py +8 -8
app.py CHANGED
@@ -17,14 +17,14 @@ peft_model_path = "./phi2-openassistant-lora-final"
17
  #base_model = AutoModelForCausalLM.from_pretrained(base_model_name, quantization_config=bnb_config, device_map={"": device})
18
  #base_model = AutoModelForCausalLM.from_pretrained(base_model_name, torch_dtype=torch.float32, device_map={"": device})
19
  #base_model = AutoModelForCausalLM.from_pretrained(base_model_name, load_in_4bit=True, device_map={"": device})
20
- bnb_config = BitsAndBytesConfig(
21
- load_in_4bit=True,
22
- bnb_4bit_compute_dtype=torch.float16,
23
- bnb_4bit_quant_type="nf4",
24
- bnb_4bit_use_double_quant=True,
25
- )
26
- base_model = AutoModelForCausalLM.from_pretrained(base_model_name, quantization_config=bnb_config, device_map={"": device})
27
-
28
 
29
 
30
 
 
17
  #base_model = AutoModelForCausalLM.from_pretrained(base_model_name, quantization_config=bnb_config, device_map={"": device})
18
  #base_model = AutoModelForCausalLM.from_pretrained(base_model_name, torch_dtype=torch.float32, device_map={"": device})
19
  #base_model = AutoModelForCausalLM.from_pretrained(base_model_name, load_in_4bit=True, device_map={"": device})
20
+ #bnb_config = BitsAndBytesConfig(
21
+ #load_in_4bit=True,
22
+ #bnb_4bit_compute_dtype=torch.float16,
23
+ #bnb_4bit_quant_type="nf4",
24
+ #bnb_4bit_use_double_quant=True,
25
+ #)
26
+ #base_model = AutoModelForCausalLM.from_pretrained(base_model_name, quantization_config=bnb_config, device_map={"": device})
27
+ base_model = AutoModelForCausalLM.from_pretrained(model_path, model_type="llama", device=device, quantization="4bit")
28
 
29
 
30