rockylynnstein committed on
Commit
ed96669
·
verified ·
1 Parent(s): 7f6d813

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +1 -1
README.md CHANGED
@@ -48,7 +48,7 @@ import torch
48
  # Load model with FP8 quantization
49
  model = AutoModelForCausalLM.from_pretrained(
50
  "TevunahAi/NextCoder-14B-FP8",
51
- torch_dtype=torch.float8_e4m3fn, # FP8 dtype
52
  device_map="auto",
53
  low_cpu_mem_usage=True,
54
  )
 
48
  # Load model with FP8 quantization
49
  model = AutoModelForCausalLM.from_pretrained(
50
  "TevunahAi/NextCoder-14B-FP8",
51
+ torch_dtype=torch.bfloat16,
52
  device_map="auto",
53
  low_cpu_mem_usage=True,
54
  )