Nick-2x committed on
Commit
6c16dfd
·
verified ·
1 Parent(s): f292e2b

Update app/main.py

Browse files
Files changed (1) hide show
  1. app/main.py +8 -1
app/main.py CHANGED
@@ -19,8 +19,15 @@ tokenizer = AutoTokenizer.from_pretrained(
19
 
20
  print("Loading model...")
21
 
 
 
 
 
22
  bnb_config = BitsAndBytesConfig(
23
- load_in_8bit=True
 
 
 
24
  )
25
 
26
  model = AutoModelForCausalLM.from_pretrained(
 
19
 
20
  print("Loading model...")
21
 
22
+ # bnb_config = BitsAndBytesConfig(
23
+ # load_in_8bit=True
24
+ # )
25
+
26
  bnb_config = BitsAndBytesConfig(
27
+ load_in_4bit=True,
28
+ bnb_4bit_compute_dtype=torch.bfloat16,
29
+ bnb_4bit_quant_type="nf4",
30
+ bnb_4bit_use_double_quant=True,
31
  )
32
 
33
  model = AutoModelForCausalLM.from_pretrained(