Linseypass committed on
Commit
c2ce80d
·
1 Parent(s): c2acbb6

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -8
app.py CHANGED
@@ -16,14 +16,8 @@ adapters_name = 'timdettmers/guanaco-7b'
16
  # print(f"Starting to load the model {model_name} into memory")
17
  m = AutoModelForCausalLM.from_pretrained(
18
  model_name,
19
- torch_dtype=torch.bfloat16,
20
- quantization_config=BitsAndBytesConfig(
21
- load_in_4bit=True,
22
- bnb_4bit_compute_dtype=torch.bfloat16,
23
- bnb_4bit_use_double_quant=True,
24
- bnb_4bit_quant_type='nf4'
25
- ),
26
- )
27
  m = PeftModel.from_pretrained(m, adapters_name)
28
  m = m.merge_and_unload()
29
  tok = LlamaTokenizer.from_pretrained(model_name)
 
16
  # print(f"Starting to load the model {model_name} into memory")
17
  m = AutoModelForCausalLM.from_pretrained(
18
  model_name,
19
+ torch_dtype=torch.bfloat16)
20
+
 
 
 
 
 
 
21
  m = PeftModel.from_pretrained(m, adapters_name)
22
  m = m.merge_and_unload()
23
  tok = LlamaTokenizer.from_pretrained(model_name)