LTX-2-SDNQ-4bit-dynamic / transformer /quantization_config.json
Disty0's picture
Upload folder using huggingface_hub
c366ccb verified
{
"add_skip_keys": false,
"dequantize_fp32": false,
"dynamic_loss_threshold": 0.01,
"group_size": 0,
"is_integer": true,
"is_training": false,
"modules_dtype_dict": {
"float5_e3m1fn": [
"transformer_blocks.0.attn1.to_k.weight",
"transformer_blocks.0.attn1.to_v.weight",
"transformer_blocks.0.ff.net.2.weight",
"transformer_blocks.0.video_to_audio_attn.to_k.weight",
"transformer_blocks.0.video_to_audio_attn.to_v.weight",
"transformer_blocks.1.ff.net.0.proj.weight",
"transformer_blocks.3.ff.net.2.weight"
],
"int5": [
"transformer_blocks.0.attn1.to_q.weight",
"transformer_blocks.0.audio_attn1.to_k.weight",
"transformer_blocks.0.audio_attn1.to_out.0.weight",
"transformer_blocks.0.audio_attn1.to_q.weight",
"transformer_blocks.0.audio_attn1.to_v.weight",
"transformer_blocks.0.audio_attn2.to_out.0.weight",
"transformer_blocks.0.audio_attn2.to_q.weight",
"transformer_blocks.0.audio_ff.net.0.proj.weight",
"transformer_blocks.0.audio_to_video_attn.to_k.weight",
"transformer_blocks.0.audio_to_video_attn.to_q.weight",
"transformer_blocks.0.audio_to_video_attn.to_v.weight",
"transformer_blocks.0.ff.net.0.proj.weight",
"transformer_blocks.0.video_to_audio_attn.to_q.weight",
"transformer_blocks.1.attn1.to_k.weight",
"transformer_blocks.1.attn1.to_q.weight",
"transformer_blocks.1.attn1.to_v.weight",
"transformer_blocks.1.audio_attn1.to_k.weight",
"transformer_blocks.1.audio_attn1.to_q.weight",
"transformer_blocks.1.audio_attn1.to_v.weight",
"transformer_blocks.1.audio_attn2.to_q.weight",
"transformer_blocks.1.audio_ff.net.0.proj.weight",
"transformer_blocks.1.audio_ff.net.2.weight",
"transformer_blocks.1.audio_to_video_attn.to_k.weight",
"transformer_blocks.1.audio_to_video_attn.to_q.weight",
"transformer_blocks.1.audio_to_video_attn.to_v.weight",
"transformer_blocks.1.ff.net.2.weight",
"transformer_blocks.1.video_to_audio_attn.to_k.weight",
"transformer_blocks.1.video_to_audio_attn.to_q.weight",
"transformer_blocks.1.video_to_audio_attn.to_v.weight",
"transformer_blocks.2.attn1.to_k.weight",
"transformer_blocks.2.attn1.to_q.weight",
"transformer_blocks.2.attn1.to_v.weight",
"transformer_blocks.2.audio_attn1.to_k.weight",
"transformer_blocks.2.audio_attn1.to_q.weight",
"transformer_blocks.2.audio_attn1.to_v.weight",
"transformer_blocks.2.audio_attn2.to_q.weight",
"transformer_blocks.2.audio_ff.net.2.weight",
"transformer_blocks.2.audio_to_video_attn.to_k.weight",
"transformer_blocks.2.audio_to_video_attn.to_q.weight",
"transformer_blocks.2.audio_to_video_attn.to_v.weight",
"transformer_blocks.2.ff.net.0.proj.weight",
"transformer_blocks.2.ff.net.2.weight",
"transformer_blocks.2.video_to_audio_attn.to_k.weight",
"transformer_blocks.2.video_to_audio_attn.to_q.weight",
"transformer_blocks.2.video_to_audio_attn.to_v.weight",
"transformer_blocks.3.attn1.to_k.weight",
"transformer_blocks.3.attn1.to_v.weight",
"transformer_blocks.3.audio_attn1.to_k.weight",
"transformer_blocks.3.audio_attn1.to_v.weight",
"transformer_blocks.3.audio_attn2.to_q.weight",
"transformer_blocks.3.audio_ff.net.2.weight",
"transformer_blocks.3.audio_to_video_attn.to_k.weight",
"transformer_blocks.3.audio_to_video_attn.to_q.weight",
"transformer_blocks.3.audio_to_video_attn.to_v.weight",
"transformer_blocks.3.ff.net.0.proj.weight",
"transformer_blocks.3.video_to_audio_attn.to_k.weight",
"transformer_blocks.3.video_to_audio_attn.to_v.weight",
"transformer_blocks.4.attn1.to_v.weight",
"transformer_blocks.4.attn2.to_q.weight",
"transformer_blocks.4.audio_attn1.to_k.weight",
"transformer_blocks.4.audio_attn1.to_v.weight",
"transformer_blocks.4.audio_attn2.to_q.weight",
"transformer_blocks.4.audio_ff.net.2.weight",
"transformer_blocks.4.audio_to_video_attn.to_k.weight",
"transformer_blocks.4.audio_to_video_attn.to_v.weight",
"transformer_blocks.4.ff.net.0.proj.weight",
"transformer_blocks.4.ff.net.2.weight",
"transformer_blocks.4.video_to_audio_attn.to_k.weight",
"transformer_blocks.4.video_to_audio_attn.to_v.weight",
"transformer_blocks.5.attn1.to_k.weight",
"transformer_blocks.5.attn1.to_v.weight",
"transformer_blocks.5.audio_attn2.to_q.weight",
"transformer_blocks.5.audio_to_video_attn.to_q.weight",
"transformer_blocks.5.video_to_audio_attn.to_k.weight",
"transformer_blocks.5.video_to_audio_attn.to_v.weight",
"transformer_blocks.10.attn2.to_k.weight",
"transformer_blocks.10.attn2.to_q.weight",
"transformer_blocks.10.audio_ff.net.2.weight",
"transformer_blocks.10.ff.net.2.weight",
"transformer_blocks.11.attn2.to_k.weight",
"transformer_blocks.11.audio_ff.net.2.weight",
"transformer_blocks.11.ff.net.2.weight",
"transformer_blocks.5.audio_ff.net.2.weight",
"transformer_blocks.5.ff.net.2.weight",
"transformer_blocks.6.audio_attn2.to_q.weight",
"transformer_blocks.6.audio_ff.net.2.weight",
"transformer_blocks.6.ff.net.2.weight",
"transformer_blocks.7.attn2.to_k.weight",
"transformer_blocks.7.attn2.to_q.weight",
"transformer_blocks.7.audio_ff.net.2.weight",
"transformer_blocks.7.ff.net.2.weight",
"transformer_blocks.8.audio_attn1.to_v.weight",
"transformer_blocks.8.audio_ff.net.2.weight",
"transformer_blocks.8.ff.net.2.weight",
"transformer_blocks.9.attn1.to_v.weight",
"transformer_blocks.9.audio_ff.net.2.weight",
"transformer_blocks.9.ff.net.2.weight",
"transformer_blocks.12.attn1.to_v.weight",
"transformer_blocks.12.attn2.to_k.weight",
"transformer_blocks.12.audio_ff.net.2.weight",
"transformer_blocks.12.ff.net.2.weight",
"transformer_blocks.13.audio_ff.net.2.weight",
"transformer_blocks.13.ff.net.2.weight",
"transformer_blocks.14.audio_ff.net.2.weight",
"transformer_blocks.14.ff.net.2.weight",
"transformer_blocks.15.audio_ff.net.2.weight",
"transformer_blocks.15.ff.net.2.weight",
"transformer_blocks.16.audio_ff.net.2.weight",
"transformer_blocks.16.ff.net.2.weight",
"transformer_blocks.17.audio_ff.net.2.weight",
"transformer_blocks.17.ff.net.2.weight",
"transformer_blocks.18.attn2.to_k.weight",
"transformer_blocks.18.ff.net.2.weight",
"transformer_blocks.19.attn2.to_k.weight",
"transformer_blocks.19.ff.net.2.weight",
"transformer_blocks.20.attn2.to_k.weight",
"transformer_blocks.20.ff.net.2.weight",
"transformer_blocks.21.attn2.to_k.weight",
"transformer_blocks.22.attn2.to_k.weight",
"transformer_blocks.23.attn2.to_k.weight",
"transformer_blocks.23.attn2.to_v.weight",
"transformer_blocks.24.attn2.to_k.weight",
"transformer_blocks.24.attn2.to_v.weight",
"transformer_blocks.25.attn2.to_k.weight",
"transformer_blocks.25.attn2.to_v.weight",
"transformer_blocks.25.audio_attn1.to_v.weight",
"transformer_blocks.25.audio_to_video_attn.to_v.weight",
"transformer_blocks.26.attn2.to_k.weight",
"transformer_blocks.26.attn2.to_v.weight",
"transformer_blocks.27.attn2.to_k.weight",
"transformer_blocks.27.attn2.to_v.weight",
"transformer_blocks.27.audio_attn1.to_v.weight",
"transformer_blocks.27.audio_to_video_attn.to_v.weight",
"transformer_blocks.28.attn2.to_k.weight",
"transformer_blocks.28.audio_attn1.to_v.weight",
"transformer_blocks.29.attn1.to_k.weight",
"transformer_blocks.29.attn2.to_k.weight",
"transformer_blocks.29.attn2.to_q.weight",
"transformer_blocks.29.attn2.to_v.weight",
"transformer_blocks.29.video_to_audio_attn.to_v.weight",
"transformer_blocks.30.attn1.to_k.weight",
"transformer_blocks.30.attn2.to_k.weight",
"transformer_blocks.30.attn2.to_v.weight",
"transformer_blocks.31.attn1.to_k.weight",
"transformer_blocks.31.attn2.to_k.weight",
"transformer_blocks.31.attn2.to_v.weight",
"transformer_blocks.32.attn2.to_k.weight",
"transformer_blocks.32.attn2.to_v.weight",
"transformer_blocks.32.video_to_audio_attn.to_v.weight",
"transformer_blocks.33.attn1.to_k.weight",
"transformer_blocks.33.attn2.to_k.weight",
"transformer_blocks.33.attn2.to_v.weight",
"transformer_blocks.34.attn2.to_k.weight",
"transformer_blocks.34.attn2.to_out.0.weight",
"transformer_blocks.34.attn2.to_v.weight",
"transformer_blocks.35.attn2.to_k.weight",
"transformer_blocks.35.attn2.to_out.0.weight",
"transformer_blocks.35.attn2.to_v.weight",
"transformer_blocks.36.attn2.to_k.weight",
"transformer_blocks.36.attn2.to_out.0.weight",
"transformer_blocks.36.attn2.to_v.weight",
"transformer_blocks.36.audio_attn1.to_v.weight",
"transformer_blocks.36.audio_to_video_attn.to_v.weight",
"transformer_blocks.37.attn1.to_k.weight",
"transformer_blocks.37.attn1.to_v.weight",
"transformer_blocks.37.attn2.to_k.weight",
"transformer_blocks.37.attn2.to_out.0.weight",
"transformer_blocks.37.attn2.to_v.weight",
"transformer_blocks.38.attn1.to_k.weight",
"transformer_blocks.38.attn1.to_v.weight",
"transformer_blocks.38.attn2.to_k.weight",
"transformer_blocks.38.attn2.to_out.0.weight",
"transformer_blocks.38.attn2.to_v.weight",
"transformer_blocks.38.audio_attn1.to_v.weight",
"transformer_blocks.38.audio_to_video_attn.to_v.weight",
"transformer_blocks.39.attn1.to_k.weight",
"transformer_blocks.39.attn1.to_v.weight",
"transformer_blocks.39.attn2.to_k.weight",
"transformer_blocks.39.attn2.to_out.0.weight",
"transformer_blocks.39.attn2.to_v.weight",
"transformer_blocks.40.attn1.to_k.weight",
"transformer_blocks.40.attn1.to_v.weight",
"transformer_blocks.40.attn2.to_k.weight",
"transformer_blocks.40.attn2.to_out.0.weight",
"transformer_blocks.40.attn2.to_v.weight",
"transformer_blocks.40.video_to_audio_attn.to_k.weight",
"transformer_blocks.41.attn1.to_k.weight",
"transformer_blocks.41.attn1.to_v.weight",
"transformer_blocks.41.attn2.to_k.weight",
"transformer_blocks.41.attn2.to_out.0.weight",
"transformer_blocks.41.attn2.to_v.weight",
"transformer_blocks.41.audio_attn1.to_v.weight",
"transformer_blocks.41.audio_to_video_attn.to_v.weight",
"transformer_blocks.41.video_to_audio_attn.to_k.weight",
"transformer_blocks.42.attn1.to_k.weight",
"transformer_blocks.42.attn1.to_v.weight",
"transformer_blocks.42.attn2.to_k.weight",
"transformer_blocks.42.attn2.to_out.0.weight",
"transformer_blocks.42.attn2.to_v.weight",
"transformer_blocks.42.audio_ff.net.2.weight",
"transformer_blocks.42.audio_to_video_attn.to_v.weight",
"transformer_blocks.42.video_to_audio_attn.to_k.weight",
"transformer_blocks.43.attn1.to_k.weight",
"transformer_blocks.43.attn2.to_k.weight",
"transformer_blocks.43.attn2.to_out.0.weight",
"transformer_blocks.43.attn2.to_v.weight",
"transformer_blocks.43.audio_ff.net.2.weight",
"transformer_blocks.43.video_to_audio_attn.to_k.weight",
"transformer_blocks.44.attn1.to_k.weight",
"transformer_blocks.44.attn2.to_k.weight",
"transformer_blocks.44.attn2.to_out.0.weight",
"transformer_blocks.44.attn2.to_v.weight",
"transformer_blocks.44.audio_ff.net.2.weight",
"transformer_blocks.44.video_to_audio_attn.to_k.weight",
"transformer_blocks.45.attn1.to_k.weight",
"transformer_blocks.45.attn1.to_v.weight",
"transformer_blocks.45.attn2.to_k.weight",
"transformer_blocks.45.attn2.to_out.0.weight",
"transformer_blocks.45.attn2.to_v.weight",
"transformer_blocks.45.audio_ff.net.2.weight",
"transformer_blocks.45.video_to_audio_attn.to_k.weight",
"transformer_blocks.46.attn1.to_k.weight",
"transformer_blocks.46.attn1.to_v.weight",
"transformer_blocks.46.attn2.to_k.weight",
"transformer_blocks.46.attn2.to_out.0.weight",
"transformer_blocks.46.attn2.to_v.weight",
"transformer_blocks.46.audio_attn1.to_k.weight",
"transformer_blocks.46.audio_attn1.to_v.weight",
"transformer_blocks.46.audio_ff.net.2.weight",
"transformer_blocks.46.audio_to_video_attn.to_k.weight",
"transformer_blocks.46.audio_to_video_attn.to_v.weight",
"transformer_blocks.46.video_to_audio_attn.to_k.weight",
"transformer_blocks.47.attn1.to_k.weight",
"transformer_blocks.47.attn1.to_q.weight",
"transformer_blocks.47.attn1.to_v.weight",
"transformer_blocks.47.attn2.to_out.0.weight",
"transformer_blocks.47.attn2.to_v.weight",
"transformer_blocks.47.audio_attn1.to_v.weight",
"transformer_blocks.47.audio_attn2.to_out.0.weight",
"transformer_blocks.47.audio_ff.net.2.weight",
"transformer_blocks.47.audio_to_video_attn.to_q.weight",
"transformer_blocks.47.audio_to_video_attn.to_v.weight",
"transformer_blocks.47.ff.net.2.weight",
"transformer_blocks.47.video_to_audio_attn.to_k.weight",
"transformer_blocks.47.video_to_audio_attn.to_v.weight"
],
"uint4": [
"transformer_blocks.0.attn1.to_out.0.weight",
"transformer_blocks.0.attn2.to_k.weight",
"transformer_blocks.0.attn2.to_out.0.weight",
"transformer_blocks.0.attn2.to_q.weight",
"transformer_blocks.0.attn2.to_v.weight",
"transformer_blocks.0.audio_attn2.to_k.weight",
"transformer_blocks.0.audio_attn2.to_v.weight",
"transformer_blocks.0.audio_ff.net.2.weight",
"transformer_blocks.0.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.0.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.1.attn1.to_out.0.weight",
"transformer_blocks.1.attn2.to_k.weight",
"transformer_blocks.1.attn2.to_out.0.weight",
"transformer_blocks.1.attn2.to_q.weight",
"transformer_blocks.1.attn2.to_v.weight",
"transformer_blocks.1.audio_attn1.to_out.0.weight",
"transformer_blocks.1.audio_attn2.to_k.weight",
"transformer_blocks.1.audio_attn2.to_out.0.weight",
"transformer_blocks.1.audio_attn2.to_v.weight",
"transformer_blocks.1.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.1.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.2.attn1.to_out.0.weight",
"transformer_blocks.2.attn2.to_k.weight",
"transformer_blocks.2.attn2.to_out.0.weight",
"transformer_blocks.2.attn2.to_q.weight",
"transformer_blocks.2.attn2.to_v.weight",
"transformer_blocks.2.audio_attn1.to_out.0.weight",
"transformer_blocks.2.audio_attn2.to_k.weight",
"transformer_blocks.2.audio_attn2.to_out.0.weight",
"transformer_blocks.2.audio_attn2.to_v.weight",
"transformer_blocks.2.audio_ff.net.0.proj.weight",
"transformer_blocks.2.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.2.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.3.attn1.to_out.0.weight",
"transformer_blocks.3.attn1.to_q.weight",
"transformer_blocks.3.attn2.to_k.weight",
"transformer_blocks.3.attn2.to_out.0.weight",
"transformer_blocks.3.attn2.to_q.weight",
"transformer_blocks.3.attn2.to_v.weight",
"transformer_blocks.3.audio_attn1.to_out.0.weight",
"transformer_blocks.3.audio_attn1.to_q.weight",
"transformer_blocks.3.audio_attn2.to_k.weight",
"transformer_blocks.3.audio_attn2.to_out.0.weight",
"transformer_blocks.3.audio_attn2.to_v.weight",
"transformer_blocks.3.audio_ff.net.0.proj.weight",
"transformer_blocks.3.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.3.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.3.video_to_audio_attn.to_q.weight",
"transformer_blocks.4.attn1.to_k.weight",
"transformer_blocks.4.attn1.to_out.0.weight",
"transformer_blocks.4.attn1.to_q.weight",
"transformer_blocks.4.attn2.to_k.weight",
"transformer_blocks.4.attn2.to_out.0.weight",
"transformer_blocks.4.attn2.to_v.weight",
"transformer_blocks.4.audio_attn1.to_out.0.weight",
"transformer_blocks.4.audio_attn1.to_q.weight",
"transformer_blocks.4.audio_attn2.to_k.weight",
"transformer_blocks.4.audio_attn2.to_out.0.weight",
"transformer_blocks.4.audio_attn2.to_v.weight",
"transformer_blocks.4.audio_ff.net.0.proj.weight",
"transformer_blocks.4.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.4.audio_to_video_attn.to_q.weight",
"transformer_blocks.4.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.4.video_to_audio_attn.to_q.weight",
"transformer_blocks.5.attn1.to_out.0.weight",
"transformer_blocks.5.attn1.to_q.weight",
"transformer_blocks.5.attn2.to_k.weight",
"transformer_blocks.5.attn2.to_out.0.weight",
"transformer_blocks.5.attn2.to_q.weight",
"transformer_blocks.5.attn2.to_v.weight",
"transformer_blocks.5.audio_attn1.to_k.weight",
"transformer_blocks.5.audio_attn1.to_out.0.weight",
"transformer_blocks.5.audio_attn1.to_q.weight",
"transformer_blocks.5.audio_attn1.to_v.weight",
"transformer_blocks.5.audio_attn2.to_k.weight",
"transformer_blocks.5.audio_attn2.to_out.0.weight",
"transformer_blocks.5.audio_attn2.to_v.weight",
"transformer_blocks.5.audio_to_video_attn.to_k.weight",
"transformer_blocks.5.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.5.audio_to_video_attn.to_v.weight",
"transformer_blocks.5.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.5.video_to_audio_attn.to_q.weight",
"transformer_blocks.10.attn1.to_k.weight",
"transformer_blocks.10.attn1.to_out.0.weight",
"transformer_blocks.10.attn1.to_q.weight",
"transformer_blocks.10.attn1.to_v.weight",
"transformer_blocks.10.attn2.to_out.0.weight",
"transformer_blocks.10.attn2.to_v.weight",
"transformer_blocks.10.audio_attn1.to_k.weight",
"transformer_blocks.10.audio_attn1.to_out.0.weight",
"transformer_blocks.10.audio_attn1.to_q.weight",
"transformer_blocks.10.audio_attn1.to_v.weight",
"transformer_blocks.10.audio_attn2.to_k.weight",
"transformer_blocks.10.audio_attn2.to_out.0.weight",
"transformer_blocks.10.audio_attn2.to_q.weight",
"transformer_blocks.10.audio_attn2.to_v.weight",
"transformer_blocks.10.audio_ff.net.0.proj.weight",
"transformer_blocks.10.audio_to_video_attn.to_k.weight",
"transformer_blocks.10.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.10.audio_to_video_attn.to_q.weight",
"transformer_blocks.10.audio_to_video_attn.to_v.weight",
"transformer_blocks.10.ff.net.0.proj.weight",
"transformer_blocks.10.video_to_audio_attn.to_k.weight",
"transformer_blocks.10.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.10.video_to_audio_attn.to_q.weight",
"transformer_blocks.10.video_to_audio_attn.to_v.weight",
"transformer_blocks.11.attn1.to_k.weight",
"transformer_blocks.11.attn1.to_out.0.weight",
"transformer_blocks.11.attn1.to_q.weight",
"transformer_blocks.11.attn1.to_v.weight",
"transformer_blocks.11.attn2.to_out.0.weight",
"transformer_blocks.11.attn2.to_q.weight",
"transformer_blocks.11.attn2.to_v.weight",
"transformer_blocks.11.audio_attn1.to_k.weight",
"transformer_blocks.11.audio_attn1.to_out.0.weight",
"transformer_blocks.11.audio_attn1.to_q.weight",
"transformer_blocks.11.audio_attn1.to_v.weight",
"transformer_blocks.11.audio_attn2.to_k.weight",
"transformer_blocks.11.audio_attn2.to_out.0.weight",
"transformer_blocks.11.audio_attn2.to_q.weight",
"transformer_blocks.11.audio_attn2.to_v.weight",
"transformer_blocks.11.audio_ff.net.0.proj.weight",
"transformer_blocks.11.audio_to_video_attn.to_k.weight",
"transformer_blocks.11.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.11.audio_to_video_attn.to_q.weight",
"transformer_blocks.11.audio_to_video_attn.to_v.weight",
"transformer_blocks.11.ff.net.0.proj.weight",
"transformer_blocks.11.video_to_audio_attn.to_k.weight",
"transformer_blocks.11.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.11.video_to_audio_attn.to_q.weight",
"transformer_blocks.11.video_to_audio_attn.to_v.weight",
"transformer_blocks.5.audio_ff.net.0.proj.weight",
"transformer_blocks.5.ff.net.0.proj.weight",
"transformer_blocks.6.attn1.to_k.weight",
"transformer_blocks.6.attn1.to_out.0.weight",
"transformer_blocks.6.attn1.to_q.weight",
"transformer_blocks.6.attn1.to_v.weight",
"transformer_blocks.6.attn2.to_k.weight",
"transformer_blocks.6.attn2.to_out.0.weight",
"transformer_blocks.6.attn2.to_q.weight",
"transformer_blocks.6.attn2.to_v.weight",
"transformer_blocks.6.audio_attn1.to_k.weight",
"transformer_blocks.6.audio_attn1.to_out.0.weight",
"transformer_blocks.6.audio_attn1.to_q.weight",
"transformer_blocks.6.audio_attn1.to_v.weight",
"transformer_blocks.6.audio_attn2.to_k.weight",
"transformer_blocks.6.audio_attn2.to_out.0.weight",
"transformer_blocks.6.audio_attn2.to_v.weight",
"transformer_blocks.6.audio_ff.net.0.proj.weight",
"transformer_blocks.6.audio_to_video_attn.to_k.weight",
"transformer_blocks.6.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.6.audio_to_video_attn.to_q.weight",
"transformer_blocks.6.audio_to_video_attn.to_v.weight",
"transformer_blocks.6.ff.net.0.proj.weight",
"transformer_blocks.6.video_to_audio_attn.to_k.weight",
"transformer_blocks.6.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.6.video_to_audio_attn.to_q.weight",
"transformer_blocks.6.video_to_audio_attn.to_v.weight",
"transformer_blocks.7.attn1.to_k.weight",
"transformer_blocks.7.attn1.to_out.0.weight",
"transformer_blocks.7.attn1.to_q.weight",
"transformer_blocks.7.attn1.to_v.weight",
"transformer_blocks.7.attn2.to_out.0.weight",
"transformer_blocks.7.attn2.to_v.weight",
"transformer_blocks.7.audio_attn1.to_k.weight",
"transformer_blocks.7.audio_attn1.to_out.0.weight",
"transformer_blocks.7.audio_attn1.to_q.weight",
"transformer_blocks.7.audio_attn1.to_v.weight",
"transformer_blocks.7.audio_attn2.to_k.weight",
"transformer_blocks.7.audio_attn2.to_out.0.weight",
"transformer_blocks.7.audio_attn2.to_q.weight",
"transformer_blocks.7.audio_attn2.to_v.weight",
"transformer_blocks.7.audio_ff.net.0.proj.weight",
"transformer_blocks.7.audio_to_video_attn.to_k.weight",
"transformer_blocks.7.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.7.audio_to_video_attn.to_q.weight",
"transformer_blocks.7.audio_to_video_attn.to_v.weight",
"transformer_blocks.7.ff.net.0.proj.weight",
"transformer_blocks.7.video_to_audio_attn.to_k.weight",
"transformer_blocks.7.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.7.video_to_audio_attn.to_q.weight",
"transformer_blocks.7.video_to_audio_attn.to_v.weight",
"transformer_blocks.8.attn1.to_k.weight",
"transformer_blocks.8.attn1.to_out.0.weight",
"transformer_blocks.8.attn1.to_q.weight",
"transformer_blocks.8.attn1.to_v.weight",
"transformer_blocks.8.attn2.to_k.weight",
"transformer_blocks.8.attn2.to_out.0.weight",
"transformer_blocks.8.attn2.to_q.weight",
"transformer_blocks.8.attn2.to_v.weight",
"transformer_blocks.8.audio_attn1.to_k.weight",
"transformer_blocks.8.audio_attn1.to_out.0.weight",
"transformer_blocks.8.audio_attn1.to_q.weight",
"transformer_blocks.8.audio_attn2.to_k.weight",
"transformer_blocks.8.audio_attn2.to_out.0.weight",
"transformer_blocks.8.audio_attn2.to_q.weight",
"transformer_blocks.8.audio_attn2.to_v.weight",
"transformer_blocks.8.audio_ff.net.0.proj.weight",
"transformer_blocks.8.audio_to_video_attn.to_k.weight",
"transformer_blocks.8.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.8.audio_to_video_attn.to_q.weight",
"transformer_blocks.8.audio_to_video_attn.to_v.weight",
"transformer_blocks.8.ff.net.0.proj.weight",
"transformer_blocks.8.video_to_audio_attn.to_k.weight",
"transformer_blocks.8.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.8.video_to_audio_attn.to_q.weight",
"transformer_blocks.8.video_to_audio_attn.to_v.weight",
"transformer_blocks.9.attn1.to_k.weight",
"transformer_blocks.9.attn1.to_out.0.weight",
"transformer_blocks.9.attn1.to_q.weight",
"transformer_blocks.9.attn2.to_k.weight",
"transformer_blocks.9.attn2.to_out.0.weight",
"transformer_blocks.9.attn2.to_q.weight",
"transformer_blocks.9.attn2.to_v.weight",
"transformer_blocks.9.audio_attn1.to_k.weight",
"transformer_blocks.9.audio_attn1.to_out.0.weight",
"transformer_blocks.9.audio_attn1.to_q.weight",
"transformer_blocks.9.audio_attn1.to_v.weight",
"transformer_blocks.9.audio_attn2.to_k.weight",
"transformer_blocks.9.audio_attn2.to_out.0.weight",
"transformer_blocks.9.audio_attn2.to_q.weight",
"transformer_blocks.9.audio_attn2.to_v.weight",
"transformer_blocks.9.audio_ff.net.0.proj.weight",
"transformer_blocks.9.audio_to_video_attn.to_k.weight",
"transformer_blocks.9.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.9.audio_to_video_attn.to_q.weight",
"transformer_blocks.9.audio_to_video_attn.to_v.weight",
"transformer_blocks.9.ff.net.0.proj.weight",
"transformer_blocks.9.video_to_audio_attn.to_k.weight",
"transformer_blocks.9.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.9.video_to_audio_attn.to_q.weight",
"transformer_blocks.9.video_to_audio_attn.to_v.weight",
"transformer_blocks.12.attn1.to_k.weight",
"transformer_blocks.12.attn1.to_out.0.weight",
"transformer_blocks.12.attn1.to_q.weight",
"transformer_blocks.12.attn2.to_out.0.weight",
"transformer_blocks.12.attn2.to_q.weight",
"transformer_blocks.12.attn2.to_v.weight",
"transformer_blocks.12.audio_attn1.to_k.weight",
"transformer_blocks.12.audio_attn1.to_out.0.weight",
"transformer_blocks.12.audio_attn1.to_q.weight",
"transformer_blocks.12.audio_attn1.to_v.weight",
"transformer_blocks.12.audio_attn2.to_k.weight",
"transformer_blocks.12.audio_attn2.to_out.0.weight",
"transformer_blocks.12.audio_attn2.to_q.weight",
"transformer_blocks.12.audio_attn2.to_v.weight",
"transformer_blocks.12.audio_ff.net.0.proj.weight",
"transformer_blocks.12.audio_to_video_attn.to_k.weight",
"transformer_blocks.12.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.12.audio_to_video_attn.to_q.weight",
"transformer_blocks.12.audio_to_video_attn.to_v.weight",
"transformer_blocks.12.ff.net.0.proj.weight",
"transformer_blocks.12.video_to_audio_attn.to_k.weight",
"transformer_blocks.12.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.12.video_to_audio_attn.to_q.weight",
"transformer_blocks.12.video_to_audio_attn.to_v.weight",
"transformer_blocks.13.attn1.to_k.weight",
"transformer_blocks.13.attn1.to_out.0.weight",
"transformer_blocks.13.attn1.to_q.weight",
"transformer_blocks.13.attn1.to_v.weight",
"transformer_blocks.13.attn2.to_k.weight",
"transformer_blocks.13.attn2.to_out.0.weight",
"transformer_blocks.13.attn2.to_q.weight",
"transformer_blocks.13.attn2.to_v.weight",
"transformer_blocks.13.audio_attn1.to_k.weight",
"transformer_blocks.13.audio_attn1.to_out.0.weight",
"transformer_blocks.13.audio_attn1.to_q.weight",
"transformer_blocks.13.audio_attn1.to_v.weight",
"transformer_blocks.13.audio_attn2.to_k.weight",
"transformer_blocks.13.audio_attn2.to_out.0.weight",
"transformer_blocks.13.audio_attn2.to_q.weight",
"transformer_blocks.13.audio_attn2.to_v.weight",
"transformer_blocks.13.audio_ff.net.0.proj.weight",
"transformer_blocks.13.audio_to_video_attn.to_k.weight",
"transformer_blocks.13.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.13.audio_to_video_attn.to_q.weight",
"transformer_blocks.13.audio_to_video_attn.to_v.weight",
"transformer_blocks.13.ff.net.0.proj.weight",
"transformer_blocks.13.video_to_audio_attn.to_k.weight",
"transformer_blocks.13.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.13.video_to_audio_attn.to_q.weight",
"transformer_blocks.13.video_to_audio_attn.to_v.weight",
"transformer_blocks.14.attn1.to_k.weight",
"transformer_blocks.14.attn1.to_out.0.weight",
"transformer_blocks.14.attn1.to_q.weight",
"transformer_blocks.14.attn1.to_v.weight",
"transformer_blocks.14.attn2.to_k.weight",
"transformer_blocks.14.attn2.to_out.0.weight",
"transformer_blocks.14.attn2.to_q.weight",
"transformer_blocks.14.attn2.to_v.weight",
"transformer_blocks.14.audio_attn1.to_k.weight",
"transformer_blocks.14.audio_attn1.to_out.0.weight",
"transformer_blocks.14.audio_attn1.to_q.weight",
"transformer_blocks.14.audio_attn1.to_v.weight",
"transformer_blocks.14.audio_attn2.to_k.weight",
"transformer_blocks.14.audio_attn2.to_out.0.weight",
"transformer_blocks.14.audio_attn2.to_q.weight",
"transformer_blocks.14.audio_attn2.to_v.weight",
"transformer_blocks.14.audio_ff.net.0.proj.weight",
"transformer_blocks.14.audio_to_video_attn.to_k.weight",
"transformer_blocks.14.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.14.audio_to_video_attn.to_q.weight",
"transformer_blocks.14.audio_to_video_attn.to_v.weight",
"transformer_blocks.14.ff.net.0.proj.weight",
"transformer_blocks.14.video_to_audio_attn.to_k.weight",
"transformer_blocks.14.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.14.video_to_audio_attn.to_q.weight",
"transformer_blocks.14.video_to_audio_attn.to_v.weight",
"transformer_blocks.15.attn1.to_k.weight",
"transformer_blocks.15.attn1.to_out.0.weight",
"transformer_blocks.15.attn1.to_q.weight",
"transformer_blocks.15.attn1.to_v.weight",
"transformer_blocks.15.attn2.to_k.weight",
"transformer_blocks.15.attn2.to_out.0.weight",
"transformer_blocks.15.attn2.to_q.weight",
"transformer_blocks.15.attn2.to_v.weight",
"transformer_blocks.15.audio_attn1.to_k.weight",
"transformer_blocks.15.audio_attn1.to_out.0.weight",
"transformer_blocks.15.audio_attn1.to_q.weight",
"transformer_blocks.15.audio_attn1.to_v.weight",
"transformer_blocks.15.audio_attn2.to_k.weight",
"transformer_blocks.15.audio_attn2.to_out.0.weight",
"transformer_blocks.15.audio_attn2.to_q.weight",
"transformer_blocks.15.audio_attn2.to_v.weight",
"transformer_blocks.15.audio_ff.net.0.proj.weight",
"transformer_blocks.15.audio_to_video_attn.to_k.weight",
"transformer_blocks.15.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.15.audio_to_video_attn.to_q.weight",
"transformer_blocks.15.audio_to_video_attn.to_v.weight",
"transformer_blocks.15.ff.net.0.proj.weight",
"transformer_blocks.15.video_to_audio_attn.to_k.weight",
"transformer_blocks.15.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.15.video_to_audio_attn.to_q.weight",
"transformer_blocks.15.video_to_audio_attn.to_v.weight",
"transformer_blocks.16.attn1.to_k.weight",
"transformer_blocks.16.attn1.to_out.0.weight",
"transformer_blocks.16.attn1.to_q.weight",
"transformer_blocks.16.attn1.to_v.weight",
"transformer_blocks.16.attn2.to_k.weight",
"transformer_blocks.16.attn2.to_out.0.weight",
"transformer_blocks.16.attn2.to_q.weight",
"transformer_blocks.16.attn2.to_v.weight",
"transformer_blocks.16.audio_attn1.to_k.weight",
"transformer_blocks.16.audio_attn1.to_out.0.weight",
"transformer_blocks.16.audio_attn1.to_q.weight",
"transformer_blocks.16.audio_attn1.to_v.weight",
"transformer_blocks.16.audio_attn2.to_k.weight",
"transformer_blocks.16.audio_attn2.to_out.0.weight",
"transformer_blocks.16.audio_attn2.to_q.weight",
"transformer_blocks.16.audio_attn2.to_v.weight",
"transformer_blocks.16.audio_ff.net.0.proj.weight",
"transformer_blocks.16.audio_to_video_attn.to_k.weight",
"transformer_blocks.16.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.16.audio_to_video_attn.to_q.weight",
"transformer_blocks.16.audio_to_video_attn.to_v.weight",
"transformer_blocks.16.ff.net.0.proj.weight",
"transformer_blocks.16.video_to_audio_attn.to_k.weight",
"transformer_blocks.16.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.16.video_to_audio_attn.to_q.weight",
"transformer_blocks.16.video_to_audio_attn.to_v.weight",
"transformer_blocks.17.attn1.to_k.weight",
"transformer_blocks.17.attn1.to_out.0.weight",
"transformer_blocks.17.attn1.to_q.weight",
"transformer_blocks.17.attn1.to_v.weight",
"transformer_blocks.17.attn2.to_k.weight",
"transformer_blocks.17.attn2.to_out.0.weight",
"transformer_blocks.17.attn2.to_q.weight",
"transformer_blocks.17.attn2.to_v.weight",
"transformer_blocks.17.audio_attn1.to_k.weight",
"transformer_blocks.17.audio_attn1.to_out.0.weight",
"transformer_blocks.17.audio_attn1.to_q.weight",
"transformer_blocks.17.audio_attn1.to_v.weight",
"transformer_blocks.17.audio_attn2.to_k.weight",
"transformer_blocks.17.audio_attn2.to_out.0.weight",
"transformer_blocks.17.audio_attn2.to_q.weight",
"transformer_blocks.17.audio_attn2.to_v.weight",
"transformer_blocks.17.audio_ff.net.0.proj.weight",
"transformer_blocks.17.audio_to_video_attn.to_k.weight",
"transformer_blocks.17.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.17.audio_to_video_attn.to_q.weight",
"transformer_blocks.17.audio_to_video_attn.to_v.weight",
"transformer_blocks.17.ff.net.0.proj.weight",
"transformer_blocks.17.video_to_audio_attn.to_k.weight",
"transformer_blocks.17.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.17.video_to_audio_attn.to_q.weight",
"transformer_blocks.17.video_to_audio_attn.to_v.weight",
"transformer_blocks.18.attn1.to_k.weight",
"transformer_blocks.18.attn1.to_out.0.weight",
"transformer_blocks.18.attn1.to_q.weight",
"transformer_blocks.18.attn1.to_v.weight",
"transformer_blocks.18.attn2.to_out.0.weight",
"transformer_blocks.18.attn2.to_q.weight",
"transformer_blocks.18.attn2.to_v.weight",
"transformer_blocks.18.audio_attn1.to_k.weight",
"transformer_blocks.18.audio_attn1.to_out.0.weight",
"transformer_blocks.18.audio_attn1.to_q.weight",
"transformer_blocks.18.audio_attn1.to_v.weight",
"transformer_blocks.18.audio_attn2.to_k.weight",
"transformer_blocks.18.audio_attn2.to_out.0.weight",
"transformer_blocks.18.audio_attn2.to_q.weight",
"transformer_blocks.18.audio_attn2.to_v.weight",
"transformer_blocks.18.audio_to_video_attn.to_k.weight",
"transformer_blocks.18.audio_to_video_attn.to_q.weight",
"transformer_blocks.18.audio_ff.net.0.proj.weight",
"transformer_blocks.18.audio_ff.net.2.weight",
"transformer_blocks.18.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.18.audio_to_video_attn.to_v.weight",
"transformer_blocks.18.ff.net.0.proj.weight",
"transformer_blocks.18.video_to_audio_attn.to_k.weight",
"transformer_blocks.18.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.18.video_to_audio_attn.to_q.weight",
"transformer_blocks.18.video_to_audio_attn.to_v.weight",
"transformer_blocks.19.attn1.to_k.weight",
"transformer_blocks.19.attn1.to_out.0.weight",
"transformer_blocks.19.attn1.to_q.weight",
"transformer_blocks.19.attn1.to_v.weight",
"transformer_blocks.19.attn2.to_out.0.weight",
"transformer_blocks.19.attn2.to_q.weight",
"transformer_blocks.19.attn2.to_v.weight",
"transformer_blocks.19.audio_attn1.to_k.weight",
"transformer_blocks.19.audio_attn1.to_out.0.weight",
"transformer_blocks.19.audio_attn1.to_q.weight",
"transformer_blocks.19.audio_attn1.to_v.weight",
"transformer_blocks.19.audio_attn2.to_k.weight",
"transformer_blocks.19.audio_attn2.to_out.0.weight",
"transformer_blocks.19.audio_attn2.to_q.weight",
"transformer_blocks.19.audio_attn2.to_v.weight",
"transformer_blocks.19.audio_ff.net.0.proj.weight",
"transformer_blocks.19.audio_ff.net.2.weight",
"transformer_blocks.19.audio_to_video_attn.to_k.weight",
"transformer_blocks.19.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.19.audio_to_video_attn.to_q.weight",
"transformer_blocks.19.audio_to_video_attn.to_v.weight",
"transformer_blocks.19.ff.net.0.proj.weight",
"transformer_blocks.19.video_to_audio_attn.to_k.weight",
"transformer_blocks.19.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.19.video_to_audio_attn.to_q.weight",
"transformer_blocks.19.video_to_audio_attn.to_v.weight",
"transformer_blocks.20.attn1.to_k.weight",
"transformer_blocks.20.attn1.to_out.0.weight",
"transformer_blocks.20.attn1.to_q.weight",
"transformer_blocks.20.attn1.to_v.weight",
"transformer_blocks.20.attn2.to_out.0.weight",
"transformer_blocks.20.attn2.to_q.weight",
"transformer_blocks.20.attn2.to_v.weight",
"transformer_blocks.20.audio_attn1.to_k.weight",
"transformer_blocks.20.audio_attn1.to_out.0.weight",
"transformer_blocks.20.audio_attn1.to_q.weight",
"transformer_blocks.20.audio_attn1.to_v.weight",
"transformer_blocks.20.audio_attn2.to_k.weight",
"transformer_blocks.20.audio_attn2.to_out.0.weight",
"transformer_blocks.20.audio_attn2.to_q.weight",
"transformer_blocks.20.audio_attn2.to_v.weight",
"transformer_blocks.20.audio_ff.net.0.proj.weight",
"transformer_blocks.20.audio_ff.net.2.weight",
"transformer_blocks.20.audio_to_video_attn.to_k.weight",
"transformer_blocks.20.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.20.audio_to_video_attn.to_q.weight",
"transformer_blocks.20.audio_to_video_attn.to_v.weight",
"transformer_blocks.20.ff.net.0.proj.weight",
"transformer_blocks.20.video_to_audio_attn.to_k.weight",
"transformer_blocks.20.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.20.video_to_audio_attn.to_q.weight",
"transformer_blocks.20.video_to_audio_attn.to_v.weight",
"transformer_blocks.21.attn1.to_k.weight",
"transformer_blocks.21.attn1.to_out.0.weight",
"transformer_blocks.21.attn1.to_q.weight",
"transformer_blocks.21.attn1.to_v.weight",
"transformer_blocks.21.attn2.to_out.0.weight",
"transformer_blocks.21.attn2.to_q.weight",
"transformer_blocks.21.attn2.to_v.weight",
"transformer_blocks.21.audio_attn1.to_k.weight",
"transformer_blocks.21.audio_attn1.to_out.0.weight",
"transformer_blocks.21.audio_attn1.to_q.weight",
"transformer_blocks.21.audio_attn1.to_v.weight",
"transformer_blocks.21.audio_attn2.to_k.weight",
"transformer_blocks.21.audio_attn2.to_out.0.weight",
"transformer_blocks.21.audio_attn2.to_q.weight",
"transformer_blocks.21.audio_attn2.to_v.weight",
"transformer_blocks.21.audio_ff.net.0.proj.weight",
"transformer_blocks.21.audio_ff.net.2.weight",
"transformer_blocks.21.audio_to_video_attn.to_k.weight",
"transformer_blocks.21.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.21.audio_to_video_attn.to_q.weight",
"transformer_blocks.21.audio_to_video_attn.to_v.weight",
"transformer_blocks.21.ff.net.0.proj.weight",
"transformer_blocks.21.ff.net.2.weight",
"transformer_blocks.21.video_to_audio_attn.to_k.weight",
"transformer_blocks.21.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.21.video_to_audio_attn.to_q.weight",
"transformer_blocks.21.video_to_audio_attn.to_v.weight",
"transformer_blocks.22.attn1.to_k.weight",
"transformer_blocks.22.attn1.to_out.0.weight",
"transformer_blocks.22.attn1.to_q.weight",
"transformer_blocks.22.attn1.to_v.weight",
"transformer_blocks.22.attn2.to_out.0.weight",
"transformer_blocks.22.attn2.to_q.weight",
"transformer_blocks.22.attn2.to_v.weight",
"transformer_blocks.22.audio_attn1.to_k.weight",
"transformer_blocks.22.audio_attn1.to_out.0.weight",
"transformer_blocks.22.audio_attn1.to_q.weight",
"transformer_blocks.22.audio_attn1.to_v.weight",
"transformer_blocks.22.audio_attn2.to_k.weight",
"transformer_blocks.22.audio_attn2.to_out.0.weight",
"transformer_blocks.22.audio_attn2.to_q.weight",
"transformer_blocks.22.audio_attn2.to_v.weight",
"transformer_blocks.22.audio_ff.net.0.proj.weight",
"transformer_blocks.22.audio_ff.net.2.weight",
"transformer_blocks.22.audio_to_video_attn.to_k.weight",
"transformer_blocks.22.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.22.audio_to_video_attn.to_q.weight",
"transformer_blocks.22.audio_to_video_attn.to_v.weight",
"transformer_blocks.22.ff.net.0.proj.weight",
"transformer_blocks.22.ff.net.2.weight",
"transformer_blocks.22.video_to_audio_attn.to_k.weight",
"transformer_blocks.22.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.22.video_to_audio_attn.to_q.weight",
"transformer_blocks.22.video_to_audio_attn.to_v.weight",
"transformer_blocks.23.attn1.to_k.weight",
"transformer_blocks.23.attn1.to_out.0.weight",
"transformer_blocks.23.attn1.to_q.weight",
"transformer_blocks.23.attn1.to_v.weight",
"transformer_blocks.23.attn2.to_out.0.weight",
"transformer_blocks.23.attn2.to_q.weight",
"transformer_blocks.23.audio_attn1.to_k.weight",
"transformer_blocks.23.audio_attn1.to_out.0.weight",
"transformer_blocks.23.audio_attn1.to_q.weight",
"transformer_blocks.23.audio_attn1.to_v.weight",
"transformer_blocks.23.audio_attn2.to_k.weight",
"transformer_blocks.23.audio_attn2.to_out.0.weight",
"transformer_blocks.23.audio_attn2.to_q.weight",
"transformer_blocks.23.audio_attn2.to_v.weight",
"transformer_blocks.23.audio_ff.net.0.proj.weight",
"transformer_blocks.23.audio_ff.net.2.weight",
"transformer_blocks.23.audio_to_video_attn.to_k.weight",
"transformer_blocks.23.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.23.audio_to_video_attn.to_q.weight",
"transformer_blocks.23.audio_to_video_attn.to_v.weight",
"transformer_blocks.23.ff.net.0.proj.weight",
"transformer_blocks.23.ff.net.2.weight",
"transformer_blocks.23.video_to_audio_attn.to_k.weight",
"transformer_blocks.23.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.23.video_to_audio_attn.to_q.weight",
"transformer_blocks.23.video_to_audio_attn.to_v.weight",
"transformer_blocks.24.attn1.to_k.weight",
"transformer_blocks.24.attn1.to_out.0.weight",
"transformer_blocks.24.attn1.to_q.weight",
"transformer_blocks.24.attn1.to_v.weight",
"transformer_blocks.24.attn2.to_out.0.weight",
"transformer_blocks.24.attn2.to_q.weight",
"transformer_blocks.24.audio_attn1.to_k.weight",
"transformer_blocks.24.audio_attn1.to_out.0.weight",
"transformer_blocks.24.audio_attn1.to_q.weight",
"transformer_blocks.24.audio_attn1.to_v.weight",
"transformer_blocks.24.audio_attn2.to_k.weight",
"transformer_blocks.24.audio_attn2.to_out.0.weight",
"transformer_blocks.24.audio_attn2.to_q.weight",
"transformer_blocks.24.audio_attn2.to_v.weight",
"transformer_blocks.24.audio_to_video_attn.to_k.weight",
"transformer_blocks.24.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.24.audio_to_video_attn.to_q.weight",
"transformer_blocks.24.audio_to_video_attn.to_v.weight",
"transformer_blocks.24.ff.net.0.proj.weight",
"transformer_blocks.24.ff.net.2.weight",
"transformer_blocks.24.video_to_audio_attn.to_k.weight",
"transformer_blocks.24.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.24.video_to_audio_attn.to_q.weight",
"transformer_blocks.24.video_to_audio_attn.to_v.weight",
"transformer_blocks.24.audio_ff.net.0.proj.weight",
"transformer_blocks.24.audio_ff.net.2.weight",
"transformer_blocks.25.attn1.to_k.weight",
"transformer_blocks.25.attn1.to_out.0.weight",
"transformer_blocks.25.attn1.to_q.weight",
"transformer_blocks.25.attn1.to_v.weight",
"transformer_blocks.25.attn2.to_out.0.weight",
"transformer_blocks.25.attn2.to_q.weight",
"transformer_blocks.25.audio_attn1.to_k.weight",
"transformer_blocks.25.audio_attn1.to_out.0.weight",
"transformer_blocks.25.audio_attn1.to_q.weight",
"transformer_blocks.25.audio_attn2.to_k.weight",
"transformer_blocks.25.audio_attn2.to_out.0.weight",
"transformer_blocks.25.audio_attn2.to_q.weight",
"transformer_blocks.25.audio_attn2.to_v.weight",
"transformer_blocks.25.audio_ff.net.0.proj.weight",
"transformer_blocks.25.audio_ff.net.2.weight",
"transformer_blocks.25.audio_to_video_attn.to_k.weight",
"transformer_blocks.25.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.25.audio_to_video_attn.to_q.weight",
"transformer_blocks.25.ff.net.0.proj.weight",
"transformer_blocks.25.ff.net.2.weight",
"transformer_blocks.25.video_to_audio_attn.to_k.weight",
"transformer_blocks.25.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.25.video_to_audio_attn.to_q.weight",
"transformer_blocks.25.video_to_audio_attn.to_v.weight",
"transformer_blocks.26.attn1.to_k.weight",
"transformer_blocks.26.attn1.to_out.0.weight",
"transformer_blocks.26.attn1.to_q.weight",
"transformer_blocks.26.attn1.to_v.weight",
"transformer_blocks.26.attn2.to_out.0.weight",
"transformer_blocks.26.attn2.to_q.weight",
"transformer_blocks.26.audio_attn1.to_k.weight",
"transformer_blocks.26.audio_attn1.to_out.0.weight",
"transformer_blocks.26.audio_attn1.to_q.weight",
"transformer_blocks.26.audio_attn1.to_v.weight",
"transformer_blocks.26.audio_attn2.to_k.weight",
"transformer_blocks.26.audio_attn2.to_out.0.weight",
"transformer_blocks.26.audio_attn2.to_q.weight",
"transformer_blocks.26.audio_attn2.to_v.weight",
"transformer_blocks.26.audio_ff.net.0.proj.weight",
"transformer_blocks.26.audio_ff.net.2.weight",
"transformer_blocks.26.audio_to_video_attn.to_k.weight",
"transformer_blocks.26.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.26.audio_to_video_attn.to_q.weight",
"transformer_blocks.26.audio_to_video_attn.to_v.weight",
"transformer_blocks.26.ff.net.0.proj.weight",
"transformer_blocks.26.ff.net.2.weight",
"transformer_blocks.26.video_to_audio_attn.to_k.weight",
"transformer_blocks.26.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.26.video_to_audio_attn.to_q.weight",
"transformer_blocks.26.video_to_audio_attn.to_v.weight",
"transformer_blocks.27.attn1.to_k.weight",
"transformer_blocks.27.attn1.to_out.0.weight",
"transformer_blocks.27.attn1.to_q.weight",
"transformer_blocks.27.attn1.to_v.weight",
"transformer_blocks.27.attn2.to_out.0.weight",
"transformer_blocks.27.attn2.to_q.weight",
"transformer_blocks.27.audio_attn1.to_k.weight",
"transformer_blocks.27.audio_attn1.to_out.0.weight",
"transformer_blocks.27.audio_attn1.to_q.weight",
"transformer_blocks.27.audio_attn2.to_k.weight",
"transformer_blocks.27.audio_attn2.to_out.0.weight",
"transformer_blocks.27.audio_attn2.to_q.weight",
"transformer_blocks.27.audio_attn2.to_v.weight",
"transformer_blocks.27.audio_ff.net.0.proj.weight",
"transformer_blocks.27.audio_ff.net.2.weight",
"transformer_blocks.27.audio_to_video_attn.to_k.weight",
"transformer_blocks.27.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.27.audio_to_video_attn.to_q.weight",
"transformer_blocks.27.ff.net.0.proj.weight",
"transformer_blocks.27.ff.net.2.weight",
"transformer_blocks.27.video_to_audio_attn.to_k.weight",
"transformer_blocks.27.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.27.video_to_audio_attn.to_q.weight",
"transformer_blocks.27.video_to_audio_attn.to_v.weight",
"transformer_blocks.28.attn1.to_k.weight",
"transformer_blocks.28.attn1.to_out.0.weight",
"transformer_blocks.28.attn1.to_q.weight",
"transformer_blocks.28.attn1.to_v.weight",
"transformer_blocks.28.attn2.to_out.0.weight",
"transformer_blocks.28.attn2.to_q.weight",
"transformer_blocks.28.attn2.to_v.weight",
"transformer_blocks.28.audio_attn1.to_k.weight",
"transformer_blocks.28.audio_attn1.to_out.0.weight",
"transformer_blocks.28.audio_attn1.to_q.weight",
"transformer_blocks.28.audio_attn2.to_k.weight",
"transformer_blocks.28.audio_attn2.to_out.0.weight",
"transformer_blocks.28.audio_attn2.to_q.weight",
"transformer_blocks.28.audio_attn2.to_v.weight",
"transformer_blocks.28.audio_ff.net.0.proj.weight",
"transformer_blocks.28.audio_ff.net.2.weight",
"transformer_blocks.28.audio_to_video_attn.to_k.weight",
"transformer_blocks.28.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.28.audio_to_video_attn.to_q.weight",
"transformer_blocks.28.audio_to_video_attn.to_v.weight",
"transformer_blocks.28.ff.net.0.proj.weight",
"transformer_blocks.28.ff.net.2.weight",
"transformer_blocks.28.video_to_audio_attn.to_k.weight",
"transformer_blocks.28.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.28.video_to_audio_attn.to_q.weight",
"transformer_blocks.28.video_to_audio_attn.to_v.weight",
"transformer_blocks.29.attn1.to_out.0.weight",
"transformer_blocks.29.attn1.to_q.weight",
"transformer_blocks.29.attn1.to_v.weight",
"transformer_blocks.29.attn2.to_out.0.weight",
"transformer_blocks.29.audio_attn1.to_k.weight",
"transformer_blocks.29.audio_attn1.to_out.0.weight",
"transformer_blocks.29.audio_attn1.to_q.weight",
"transformer_blocks.29.audio_attn1.to_v.weight",
"transformer_blocks.29.audio_attn2.to_k.weight",
"transformer_blocks.29.audio_attn2.to_out.0.weight",
"transformer_blocks.29.audio_attn2.to_q.weight",
"transformer_blocks.29.audio_attn2.to_v.weight",
"transformer_blocks.29.audio_ff.net.0.proj.weight",
"transformer_blocks.29.audio_ff.net.2.weight",
"transformer_blocks.29.audio_to_video_attn.to_k.weight",
"transformer_blocks.29.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.29.audio_to_video_attn.to_q.weight",
"transformer_blocks.29.audio_to_video_attn.to_v.weight",
"transformer_blocks.29.ff.net.0.proj.weight",
"transformer_blocks.29.ff.net.2.weight",
"transformer_blocks.29.video_to_audio_attn.to_k.weight",
"transformer_blocks.29.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.29.video_to_audio_attn.to_q.weight",
"transformer_blocks.30.attn1.to_out.0.weight",
"transformer_blocks.30.attn1.to_q.weight",
"transformer_blocks.30.attn1.to_v.weight",
"transformer_blocks.30.attn2.to_out.0.weight",
"transformer_blocks.30.attn2.to_q.weight",
"transformer_blocks.30.audio_attn1.to_k.weight",
"transformer_blocks.30.audio_attn1.to_out.0.weight",
"transformer_blocks.30.audio_attn1.to_q.weight",
"transformer_blocks.30.audio_attn1.to_v.weight",
"transformer_blocks.30.audio_attn2.to_k.weight",
"transformer_blocks.30.audio_attn2.to_out.0.weight",
"transformer_blocks.30.audio_attn2.to_q.weight",
"transformer_blocks.30.audio_attn2.to_v.weight",
"transformer_blocks.30.audio_ff.net.0.proj.weight",
"transformer_blocks.30.audio_ff.net.2.weight",
"transformer_blocks.30.audio_to_video_attn.to_k.weight",
"transformer_blocks.30.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.30.audio_to_video_attn.to_q.weight",
"transformer_blocks.30.audio_to_video_attn.to_v.weight",
"transformer_blocks.30.ff.net.0.proj.weight",
"transformer_blocks.30.ff.net.2.weight",
"transformer_blocks.30.video_to_audio_attn.to_k.weight",
"transformer_blocks.30.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.30.video_to_audio_attn.to_q.weight",
"transformer_blocks.30.video_to_audio_attn.to_v.weight",
"transformer_blocks.31.attn1.to_out.0.weight",
"transformer_blocks.31.attn1.to_q.weight",
"transformer_blocks.31.attn1.to_v.weight",
"transformer_blocks.31.attn2.to_q.weight",
"transformer_blocks.31.audio_attn1.to_k.weight",
"transformer_blocks.31.audio_attn1.to_out.0.weight",
"transformer_blocks.31.audio_attn1.to_q.weight",
"transformer_blocks.31.audio_attn1.to_v.weight",
"transformer_blocks.31.attn2.to_out.0.weight",
"transformer_blocks.31.audio_attn2.to_k.weight",
"transformer_blocks.31.audio_attn2.to_out.0.weight",
"transformer_blocks.31.audio_attn2.to_q.weight",
"transformer_blocks.31.audio_attn2.to_v.weight",
"transformer_blocks.31.audio_ff.net.0.proj.weight",
"transformer_blocks.31.audio_ff.net.2.weight",
"transformer_blocks.31.audio_to_video_attn.to_k.weight",
"transformer_blocks.31.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.31.audio_to_video_attn.to_q.weight",
"transformer_blocks.31.audio_to_video_attn.to_v.weight",
"transformer_blocks.31.ff.net.0.proj.weight",
"transformer_blocks.31.ff.net.2.weight",
"transformer_blocks.31.video_to_audio_attn.to_k.weight",
"transformer_blocks.31.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.31.video_to_audio_attn.to_q.weight",
"transformer_blocks.31.video_to_audio_attn.to_v.weight",
"transformer_blocks.32.attn1.to_k.weight",
"transformer_blocks.32.attn1.to_out.0.weight",
"transformer_blocks.32.attn1.to_q.weight",
"transformer_blocks.32.attn1.to_v.weight",
"transformer_blocks.32.attn2.to_out.0.weight",
"transformer_blocks.32.attn2.to_q.weight",
"transformer_blocks.32.audio_attn1.to_k.weight",
"transformer_blocks.32.audio_attn1.to_out.0.weight",
"transformer_blocks.32.audio_attn1.to_q.weight",
"transformer_blocks.32.audio_attn1.to_v.weight",
"transformer_blocks.32.audio_attn2.to_k.weight",
"transformer_blocks.32.audio_attn2.to_out.0.weight",
"transformer_blocks.32.audio_attn2.to_q.weight",
"transformer_blocks.32.audio_attn2.to_v.weight",
"transformer_blocks.32.audio_ff.net.0.proj.weight",
"transformer_blocks.32.audio_ff.net.2.weight",
"transformer_blocks.32.audio_to_video_attn.to_k.weight",
"transformer_blocks.32.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.32.audio_to_video_attn.to_q.weight",
"transformer_blocks.32.audio_to_video_attn.to_v.weight",
"transformer_blocks.32.ff.net.0.proj.weight",
"transformer_blocks.32.ff.net.2.weight",
"transformer_blocks.32.video_to_audio_attn.to_k.weight",
"transformer_blocks.32.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.32.video_to_audio_attn.to_q.weight",
"transformer_blocks.33.attn1.to_out.0.weight",
"transformer_blocks.33.attn1.to_q.weight",
"transformer_blocks.33.attn1.to_v.weight",
"transformer_blocks.33.attn2.to_out.0.weight",
"transformer_blocks.33.attn2.to_q.weight",
"transformer_blocks.33.audio_attn1.to_k.weight",
"transformer_blocks.33.audio_attn1.to_out.0.weight",
"transformer_blocks.33.audio_attn1.to_q.weight",
"transformer_blocks.33.audio_attn1.to_v.weight",
"transformer_blocks.33.audio_attn2.to_k.weight",
"transformer_blocks.33.audio_attn2.to_out.0.weight",
"transformer_blocks.33.audio_attn2.to_q.weight",
"transformer_blocks.33.audio_attn2.to_v.weight",
"transformer_blocks.33.audio_ff.net.0.proj.weight",
"transformer_blocks.33.audio_ff.net.2.weight",
"transformer_blocks.33.audio_to_video_attn.to_k.weight",
"transformer_blocks.33.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.33.audio_to_video_attn.to_q.weight",
"transformer_blocks.33.audio_to_video_attn.to_v.weight",
"transformer_blocks.33.ff.net.0.proj.weight",
"transformer_blocks.33.ff.net.2.weight",
"transformer_blocks.33.video_to_audio_attn.to_k.weight",
"transformer_blocks.33.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.33.video_to_audio_attn.to_q.weight",
"transformer_blocks.33.video_to_audio_attn.to_v.weight",
"transformer_blocks.34.attn1.to_k.weight",
"transformer_blocks.34.attn1.to_out.0.weight",
"transformer_blocks.34.attn1.to_q.weight",
"transformer_blocks.34.attn1.to_v.weight",
"transformer_blocks.34.attn2.to_q.weight",
"transformer_blocks.34.audio_attn1.to_k.weight",
"transformer_blocks.34.audio_attn1.to_out.0.weight",
"transformer_blocks.34.audio_attn1.to_q.weight",
"transformer_blocks.34.audio_attn1.to_v.weight",
"transformer_blocks.34.audio_attn2.to_k.weight",
"transformer_blocks.34.audio_attn2.to_out.0.weight",
"transformer_blocks.34.audio_attn2.to_q.weight",
"transformer_blocks.34.audio_attn2.to_v.weight",
"transformer_blocks.34.audio_ff.net.0.proj.weight",
"transformer_blocks.34.audio_ff.net.2.weight",
"transformer_blocks.34.audio_to_video_attn.to_k.weight",
"transformer_blocks.34.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.34.audio_to_video_attn.to_q.weight",
"transformer_blocks.34.audio_to_video_attn.to_v.weight",
"transformer_blocks.34.ff.net.0.proj.weight",
"transformer_blocks.34.ff.net.2.weight",
"transformer_blocks.34.video_to_audio_attn.to_k.weight",
"transformer_blocks.34.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.34.video_to_audio_attn.to_q.weight",
"transformer_blocks.34.video_to_audio_attn.to_v.weight",
"transformer_blocks.35.attn1.to_k.weight",
"transformer_blocks.35.attn1.to_out.0.weight",
"transformer_blocks.35.attn1.to_q.weight",
"transformer_blocks.35.attn1.to_v.weight",
"transformer_blocks.35.attn2.to_q.weight",
"transformer_blocks.35.audio_attn1.to_k.weight",
"transformer_blocks.35.audio_attn1.to_out.0.weight",
"transformer_blocks.35.audio_attn1.to_q.weight",
"transformer_blocks.35.audio_attn1.to_v.weight",
"transformer_blocks.35.audio_attn2.to_k.weight",
"transformer_blocks.35.audio_attn2.to_out.0.weight",
"transformer_blocks.35.audio_attn2.to_q.weight",
"transformer_blocks.35.audio_attn2.to_v.weight",
"transformer_blocks.35.audio_ff.net.0.proj.weight",
"transformer_blocks.35.audio_ff.net.2.weight",
"transformer_blocks.35.audio_to_video_attn.to_k.weight",
"transformer_blocks.35.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.35.audio_to_video_attn.to_q.weight",
"transformer_blocks.35.audio_to_video_attn.to_v.weight",
"transformer_blocks.35.ff.net.0.proj.weight",
"transformer_blocks.35.ff.net.2.weight",
"transformer_blocks.35.video_to_audio_attn.to_k.weight",
"transformer_blocks.35.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.35.video_to_audio_attn.to_q.weight",
"transformer_blocks.35.video_to_audio_attn.to_v.weight",
"transformer_blocks.36.attn1.to_k.weight",
"transformer_blocks.36.attn1.to_out.0.weight",
"transformer_blocks.36.attn1.to_q.weight",
"transformer_blocks.36.attn1.to_v.weight",
"transformer_blocks.36.attn2.to_q.weight",
"transformer_blocks.36.audio_attn1.to_k.weight",
"transformer_blocks.36.audio_attn1.to_out.0.weight",
"transformer_blocks.36.audio_attn1.to_q.weight",
"transformer_blocks.36.audio_attn2.to_k.weight",
"transformer_blocks.36.audio_attn2.to_out.0.weight",
"transformer_blocks.36.audio_attn2.to_q.weight",
"transformer_blocks.36.audio_attn2.to_v.weight",
"transformer_blocks.36.audio_ff.net.0.proj.weight",
"transformer_blocks.36.audio_ff.net.2.weight",
"transformer_blocks.36.audio_to_video_attn.to_k.weight",
"transformer_blocks.36.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.36.audio_to_video_attn.to_q.weight",
"transformer_blocks.36.ff.net.0.proj.weight",
"transformer_blocks.36.ff.net.2.weight",
"transformer_blocks.36.video_to_audio_attn.to_k.weight",
"transformer_blocks.36.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.36.video_to_audio_attn.to_q.weight",
"transformer_blocks.36.video_to_audio_attn.to_v.weight",
"transformer_blocks.37.attn1.to_out.0.weight",
"transformer_blocks.37.attn1.to_q.weight",
"transformer_blocks.37.attn2.to_q.weight",
"transformer_blocks.37.audio_attn1.to_k.weight",
"transformer_blocks.37.audio_attn1.to_out.0.weight",
"transformer_blocks.37.audio_attn1.to_q.weight",
"transformer_blocks.37.audio_attn1.to_v.weight",
"transformer_blocks.37.audio_attn2.to_k.weight",
"transformer_blocks.37.audio_attn2.to_out.0.weight",
"transformer_blocks.37.audio_attn2.to_q.weight",
"transformer_blocks.37.audio_attn2.to_v.weight",
"transformer_blocks.37.audio_to_video_attn.to_k.weight",
"transformer_blocks.37.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.37.audio_to_video_attn.to_q.weight",
"transformer_blocks.37.audio_to_video_attn.to_v.weight",
"transformer_blocks.37.ff.net.0.proj.weight",
"transformer_blocks.37.video_to_audio_attn.to_k.weight",
"transformer_blocks.37.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.37.video_to_audio_attn.to_q.weight",
"transformer_blocks.37.video_to_audio_attn.to_v.weight",
"transformer_blocks.37.audio_ff.net.0.proj.weight",
"transformer_blocks.37.audio_ff.net.2.weight",
"transformer_blocks.37.ff.net.2.weight",
"transformer_blocks.38.attn1.to_out.0.weight",
"transformer_blocks.38.attn1.to_q.weight",
"transformer_blocks.38.attn2.to_q.weight",
"transformer_blocks.38.audio_attn1.to_k.weight",
"transformer_blocks.38.audio_attn1.to_out.0.weight",
"transformer_blocks.38.audio_attn1.to_q.weight",
"transformer_blocks.38.audio_attn2.to_k.weight",
"transformer_blocks.38.audio_attn2.to_out.0.weight",
"transformer_blocks.38.audio_attn2.to_q.weight",
"transformer_blocks.38.audio_attn2.to_v.weight",
"transformer_blocks.38.audio_ff.net.0.proj.weight",
"transformer_blocks.38.audio_ff.net.2.weight",
"transformer_blocks.38.audio_to_video_attn.to_k.weight",
"transformer_blocks.38.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.38.audio_to_video_attn.to_q.weight",
"transformer_blocks.38.ff.net.0.proj.weight",
"transformer_blocks.38.ff.net.2.weight",
"transformer_blocks.38.video_to_audio_attn.to_k.weight",
"transformer_blocks.38.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.38.video_to_audio_attn.to_q.weight",
"transformer_blocks.38.video_to_audio_attn.to_v.weight",
"transformer_blocks.39.attn1.to_out.0.weight",
"transformer_blocks.39.attn1.to_q.weight",
"transformer_blocks.39.attn2.to_q.weight",
"transformer_blocks.39.audio_attn1.to_k.weight",
"transformer_blocks.39.audio_attn1.to_out.0.weight",
"transformer_blocks.39.audio_attn1.to_q.weight",
"transformer_blocks.39.audio_attn1.to_v.weight",
"transformer_blocks.39.audio_attn2.to_k.weight",
"transformer_blocks.39.audio_attn2.to_out.0.weight",
"transformer_blocks.39.audio_attn2.to_q.weight",
"transformer_blocks.39.audio_attn2.to_v.weight",
"transformer_blocks.39.audio_ff.net.0.proj.weight",
"transformer_blocks.39.audio_ff.net.2.weight",
"transformer_blocks.39.audio_to_video_attn.to_k.weight",
"transformer_blocks.39.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.39.audio_to_video_attn.to_q.weight",
"transformer_blocks.39.audio_to_video_attn.to_v.weight",
"transformer_blocks.39.ff.net.0.proj.weight",
"transformer_blocks.39.ff.net.2.weight",
"transformer_blocks.39.video_to_audio_attn.to_k.weight",
"transformer_blocks.39.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.39.video_to_audio_attn.to_q.weight",
"transformer_blocks.39.video_to_audio_attn.to_v.weight",
"transformer_blocks.40.attn1.to_out.0.weight",
"transformer_blocks.40.attn1.to_q.weight",
"transformer_blocks.40.attn2.to_q.weight",
"transformer_blocks.40.audio_attn1.to_k.weight",
"transformer_blocks.40.audio_attn1.to_out.0.weight",
"transformer_blocks.40.audio_attn1.to_q.weight",
"transformer_blocks.40.audio_attn1.to_v.weight",
"transformer_blocks.40.audio_attn2.to_k.weight",
"transformer_blocks.40.audio_attn2.to_out.0.weight",
"transformer_blocks.40.audio_attn2.to_q.weight",
"transformer_blocks.40.audio_attn2.to_v.weight",
"transformer_blocks.40.audio_ff.net.0.proj.weight",
"transformer_blocks.40.audio_ff.net.2.weight",
"transformer_blocks.40.audio_to_video_attn.to_k.weight",
"transformer_blocks.40.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.40.audio_to_video_attn.to_q.weight",
"transformer_blocks.40.audio_to_video_attn.to_v.weight",
"transformer_blocks.40.ff.net.0.proj.weight",
"transformer_blocks.40.ff.net.2.weight",
"transformer_blocks.40.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.40.video_to_audio_attn.to_q.weight",
"transformer_blocks.40.video_to_audio_attn.to_v.weight",
"transformer_blocks.41.attn1.to_out.0.weight",
"transformer_blocks.41.attn1.to_q.weight",
"transformer_blocks.41.attn2.to_q.weight",
"transformer_blocks.41.audio_attn1.to_k.weight",
"transformer_blocks.41.audio_attn1.to_out.0.weight",
"transformer_blocks.41.audio_attn1.to_q.weight",
"transformer_blocks.41.audio_attn2.to_k.weight",
"transformer_blocks.41.audio_attn2.to_out.0.weight",
"transformer_blocks.41.audio_attn2.to_q.weight",
"transformer_blocks.41.audio_attn2.to_v.weight",
"transformer_blocks.41.audio_ff.net.0.proj.weight",
"transformer_blocks.41.audio_ff.net.2.weight",
"transformer_blocks.41.audio_to_video_attn.to_k.weight",
"transformer_blocks.41.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.41.audio_to_video_attn.to_q.weight",
"transformer_blocks.41.ff.net.0.proj.weight",
"transformer_blocks.41.ff.net.2.weight",
"transformer_blocks.41.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.41.video_to_audio_attn.to_q.weight",
"transformer_blocks.41.video_to_audio_attn.to_v.weight",
"transformer_blocks.42.attn1.to_out.0.weight",
"transformer_blocks.42.attn1.to_q.weight",
"transformer_blocks.42.attn2.to_q.weight",
"transformer_blocks.42.audio_attn1.to_k.weight",
"transformer_blocks.42.audio_attn1.to_out.0.weight",
"transformer_blocks.42.audio_attn1.to_q.weight",
"transformer_blocks.42.audio_attn1.to_v.weight",
"transformer_blocks.42.audio_attn2.to_k.weight",
"transformer_blocks.42.audio_attn2.to_out.0.weight",
"transformer_blocks.42.audio_attn2.to_q.weight",
"transformer_blocks.42.audio_attn2.to_v.weight",
"transformer_blocks.42.audio_ff.net.0.proj.weight",
"transformer_blocks.42.audio_to_video_attn.to_k.weight",
"transformer_blocks.42.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.42.audio_to_video_attn.to_q.weight",
"transformer_blocks.42.ff.net.0.proj.weight",
"transformer_blocks.42.ff.net.2.weight",
"transformer_blocks.42.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.42.video_to_audio_attn.to_q.weight",
"transformer_blocks.42.video_to_audio_attn.to_v.weight",
"transformer_blocks.43.attn1.to_out.0.weight",
"transformer_blocks.43.attn1.to_q.weight",
"transformer_blocks.43.attn1.to_v.weight",
"transformer_blocks.43.attn2.to_q.weight",
"transformer_blocks.43.audio_attn1.to_k.weight",
"transformer_blocks.43.audio_attn1.to_out.0.weight",
"transformer_blocks.43.audio_attn1.to_q.weight",
"transformer_blocks.43.audio_attn1.to_v.weight",
"transformer_blocks.43.audio_attn2.to_k.weight",
"transformer_blocks.43.audio_attn2.to_out.0.weight",
"transformer_blocks.43.audio_attn2.to_q.weight",
"transformer_blocks.43.audio_attn2.to_v.weight",
"transformer_blocks.43.audio_ff.net.0.proj.weight",
"transformer_blocks.43.audio_to_video_attn.to_k.weight",
"transformer_blocks.43.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.43.audio_to_video_attn.to_q.weight",
"transformer_blocks.43.audio_to_video_attn.to_v.weight",
"transformer_blocks.43.ff.net.0.proj.weight",
"transformer_blocks.43.ff.net.2.weight",
"transformer_blocks.43.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.43.video_to_audio_attn.to_q.weight",
"transformer_blocks.43.video_to_audio_attn.to_v.weight",
"transformer_blocks.44.attn1.to_out.0.weight",
"transformer_blocks.44.attn1.to_q.weight",
"transformer_blocks.44.attn1.to_v.weight",
"transformer_blocks.44.audio_attn1.to_k.weight",
"transformer_blocks.44.audio_attn1.to_q.weight",
"transformer_blocks.44.audio_attn1.to_v.weight",
"transformer_blocks.44.attn2.to_q.weight",
"transformer_blocks.44.audio_attn1.to_out.0.weight",
"transformer_blocks.44.audio_attn2.to_k.weight",
"transformer_blocks.44.audio_attn2.to_out.0.weight",
"transformer_blocks.44.audio_attn2.to_q.weight",
"transformer_blocks.44.audio_attn2.to_v.weight",
"transformer_blocks.44.audio_ff.net.0.proj.weight",
"transformer_blocks.44.audio_to_video_attn.to_k.weight",
"transformer_blocks.44.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.44.audio_to_video_attn.to_q.weight",
"transformer_blocks.44.audio_to_video_attn.to_v.weight",
"transformer_blocks.44.ff.net.0.proj.weight",
"transformer_blocks.44.ff.net.2.weight",
"transformer_blocks.44.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.44.video_to_audio_attn.to_q.weight",
"transformer_blocks.44.video_to_audio_attn.to_v.weight",
"transformer_blocks.45.attn1.to_out.0.weight",
"transformer_blocks.45.attn1.to_q.weight",
"transformer_blocks.45.attn2.to_q.weight",
"transformer_blocks.45.audio_attn1.to_k.weight",
"transformer_blocks.45.audio_attn1.to_out.0.weight",
"transformer_blocks.45.audio_attn1.to_q.weight",
"transformer_blocks.45.audio_attn1.to_v.weight",
"transformer_blocks.45.audio_attn2.to_k.weight",
"transformer_blocks.45.audio_attn2.to_out.0.weight",
"transformer_blocks.45.audio_attn2.to_q.weight",
"transformer_blocks.45.audio_attn2.to_v.weight",
"transformer_blocks.45.audio_ff.net.0.proj.weight",
"transformer_blocks.45.audio_to_video_attn.to_k.weight",
"transformer_blocks.45.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.45.audio_to_video_attn.to_q.weight",
"transformer_blocks.45.audio_to_video_attn.to_v.weight",
"transformer_blocks.45.ff.net.0.proj.weight",
"transformer_blocks.45.ff.net.2.weight",
"transformer_blocks.45.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.45.video_to_audio_attn.to_q.weight",
"transformer_blocks.45.video_to_audio_attn.to_v.weight",
"transformer_blocks.46.attn1.to_out.0.weight",
"transformer_blocks.46.attn1.to_q.weight",
"transformer_blocks.46.attn2.to_q.weight",
"transformer_blocks.46.audio_attn1.to_out.0.weight",
"transformer_blocks.46.audio_attn1.to_q.weight",
"transformer_blocks.46.audio_attn2.to_k.weight",
"transformer_blocks.46.audio_attn2.to_out.0.weight",
"transformer_blocks.46.audio_attn2.to_q.weight",
"transformer_blocks.46.audio_attn2.to_v.weight",
"transformer_blocks.46.audio_ff.net.0.proj.weight",
"transformer_blocks.46.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.46.audio_to_video_attn.to_q.weight",
"transformer_blocks.46.ff.net.0.proj.weight",
"transformer_blocks.46.ff.net.2.weight",
"transformer_blocks.46.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.46.video_to_audio_attn.to_q.weight",
"transformer_blocks.46.video_to_audio_attn.to_v.weight",
"transformer_blocks.47.attn1.to_out.0.weight",
"transformer_blocks.47.attn2.to_k.weight",
"transformer_blocks.47.attn2.to_q.weight",
"transformer_blocks.47.audio_attn1.to_k.weight",
"transformer_blocks.47.audio_attn1.to_out.0.weight",
"transformer_blocks.47.audio_attn1.to_q.weight",
"transformer_blocks.47.audio_attn2.to_k.weight",
"transformer_blocks.47.audio_attn2.to_q.weight",
"transformer_blocks.47.audio_attn2.to_v.weight",
"transformer_blocks.47.audio_ff.net.0.proj.weight",
"transformer_blocks.47.audio_to_video_attn.to_k.weight",
"transformer_blocks.47.audio_to_video_attn.to_out.0.weight",
"transformer_blocks.47.ff.net.0.proj.weight",
"transformer_blocks.47.video_to_audio_attn.to_out.0.weight",
"transformer_blocks.47.video_to_audio_attn.to_q.weight"
]
},
"modules_to_not_convert": [
"proj_in",
"av_cross_attn_video_scale_shift",
"time_embed",
"av_cross_attn_video_a2v_gate",
"audio_time_embed",
"audio_proj_out",
"av_cross_attn_audio_v2a_gate",
"proj_out",
"av_cross_attn_audio_scale_shift",
"audio_caption_projection",
"audio_proj_in",
"caption_projection"
],
"non_blocking": false,
"quant_conv": false,
"quant_method": "sdnq",
"quantization_device": null,
"quantized_matmul_dtype": "int8",
"return_device": null,
"sdnq_version": "0.1.4",
"svd_rank": 32,
"svd_steps": 8,
"use_dynamic_quantization": true,
"use_grad_ckpt": true,
"use_quantized_matmul": false,
"use_quantized_matmul_conv": false,
"use_static_quantization": true,
"use_stochastic_rounding": false,
"use_svd": false,
"weights_dtype": "int4"
}