mansaripo committed on
Commit
43e4bf9
·
verified ·
1 Parent(s): 389961d

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +4 -2
README.md CHANGED
@@ -121,8 +121,10 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
121
  model = AutoModelForCausalLM.from_pretrained(
122
  "daslab-testing/CloverLM",
123
  trust_remote_code=True,
124
- torch_dtype="bfloat16",
125
- )
 
 
126
  tokenizer = AutoTokenizer.from_pretrained(
127
  "daslab-testing/CloverLM",
128
  trust_remote_code=True,
 
121
  model = AutoModelForCausalLM.from_pretrained(
122
  "daslab-testing/CloverLM",
123
  trust_remote_code=True,
124
+ dtype="bfloat16",
125
+ quartet_2_impl="quartet2", # "quartet2" uses the native NVFP4 kernel; use "pseudoquant" on non-Blackwell GPUs
126
+ ).to("cuda") # use "cuda" for GPU or "cpu" for CPU
127
+
128
  tokenizer = AutoTokenizer.from_pretrained(
129
  "daslab-testing/CloverLM",
130
  trust_remote_code=True,