Andreas99 committed on
Commit
6aea200
·
verified ·
1 Parent(s): cb37d55

Update src/litbench_pipeline.py

Browse files
Files changed (1) hide show
  1. src/litbench_pipeline.py +8 -1
src/litbench_pipeline.py CHANGED
@@ -622,9 +622,16 @@ if __name__ == "__main__":
622
  random.seed(seed_no)
623
 
624
 
 
 
 
 
 
 
 
625
  # Load model and tokenizer
626
  tokenizer = AutoTokenizer.from_pretrained(model_name)
627
- model = AutoModelForCausalLM.from_pretrained(model_name)
628
  if model.device.type != 'cuda':
629
  model.to('cuda')
630
 
 
622
  random.seed(seed_no)
623
 
624
 
625
+ # Load model and tokenizer
626
+ bnb_config = BitsAndBytesConfig(
627
+ load_in_8bit=True,
628
+ bnb_8bit_use_double_quant=True,
629
+ bnb_8bit_quant_type="nf8",
630
+ bnb_8bit_compute_dtype=torch.bfloat16
631
+ )
632
  # Load model and tokenizer
633
  tokenizer = AutoTokenizer.from_pretrained(model_name)
634
+ model = AutoModelForCausalLM.from_pretrained(model_name, quantization_config=bnb_config)
635
  if model.device.type != 'cuda':
636
  model.to('cuda')
637