Spaces:

UCODE
/

agent

Sleeping

abenkbp committed on Aug 17, 2024

Commit

f8b336e

1 Parent(s): 372ab6a

debug

Files changed (1) hide show

data/models/llama3-1-70b.py CHANGED Viewed

@@ -16,7 +16,7 @@ model_id = "meta-llama/Meta-Llama-3.1-70B-Instruct"
 pipeline = transformers.pipeline(
     "text-generation",
     model=model_id,
-    model_kwargs={"torch_dtype": torch.bfloat16},
     device="cuda",
     token=True
 )

 pipeline = transformers.pipeline(
     "text-generation",
     model=model_id,
+    model_kwargs={"torch_dtype": torch.bfloat16,"quantization_config": {"load_in_4bit": True}},
     device="cuda",
     token=True
 )