Cosmos3-Nano-FP8 / quantization_config.json
wfen's picture
fix confliction
db04faa
Raw
History Blame Contribute Delete
586 Bytes
{
"recipe": "fp8",
"weight_only": true,
"quant_lmhead": true,
"modelopt_artifact": "transformer/modelopt_quantized.pt",
"loader": "Cosmos3OmniTransformer.from_config + modelopt.restore_from_modelopt_state + safetensors load_state_dict",
"exclusions": [
"embed_tokens",
"*norm*",
"time_embedder",
"proj_in",
"proj_out",
"audio_*",
"action_*"
],
"scale_layout": {
"weight_scale_suffixes": [
"_amax",
"_scale"
],
"global_scale_suffixes": [],
"n_weight": 802,
"n_scale": 1010,
"granularity": "per-tensor"
}
}