{
  "_class_name": "LTX2AudioVisualTextEncoder",
  "_diffusers_version": "0.36.0.dev0",
  "audio_connector_attention_head_dim": 8,
  "audio_connector_num_attention_heads": 4,
  "audio_connector_num_layers": 1,
  "audio_connector_num_learnable_registers": null,
  "causal_temporal_positioning": false,
  "config_only": true,
  "rope_base_seq_len": 32,
  "rope_double_precision": false,
  "rope_theta": 10000.0,
  "text_encoder_hidden_dim": 32,
  "text_model_id": "tiny-random/gemma-3",
  "text_proj_in_factor": 3,
  "video_connector_attention_head_dim": 8,
  "video_connector_num_attention_heads": 4,
  "video_connector_num_layers": 1,
  "video_connector_num_learnable_registers": null
}