abenkbp committed on
Commit
f8b336e
·
1 Parent(s): 372ab6a
Files changed (1) hide show
  1. data/models/llama3-1-70b.py +1 -1
data/models/llama3-1-70b.py CHANGED
@@ -16,7 +16,7 @@ model_id = "meta-llama/Meta-Llama-3.1-70B-Instruct"
16
  pipeline = transformers.pipeline(
17
  "text-generation",
18
  model=model_id,
19
- model_kwargs={"torch_dtype": torch.bfloat16},
20
  device="cuda",
21
  token=True
22
  )
 
16
  pipeline = transformers.pipeline(
17
  "text-generation",
18
  model=model_id,
19
+ model_kwargs={"torch_dtype": torch.bfloat16,"quantization_config": {"load_in_4bit": True}},
20
  device="cuda",
21
  token=True
22
  )