wfen
/

Cosmos3-Nano-FP8

Cosmos3OmniDiffusersPipeline

Model card | Files and versions

Cosmos3-Nano-FP8 / quantization_config.json

wfen's picture

fix conflict

db04faa 15 days ago

History Blame Contribute Delete

586 Bytes

	{
	"recipe": "fp8",
	"weight_only": true,
	"quant_lmhead": true,
	"modelopt_artifact": "transformer/modelopt_quantized.pt",
	"loader": "Cosmos3OmniTransformer.from_config + modelopt.restore_from_modelopt_state + safetensors load_state_dict",
	"exclusions": [
	"embed_tokens",
	"norm",
	"time_embedder",
	"proj_in",
	"proj_out",
	"audio_*",
	"action_*"
	],
	"scale_layout": {
	"weight_scale_suffixes": [
	"_amax",
	"_scale"
	],
	"global_scale_suffixes": [],
	"n_weight": 802,
	"n_scale": 1010,
	"granularity": "per-tensor"
	}
	}