{
  "_class_name": "FoleyOmniConfig",
  "_name_or_path": "CocoBro/Foley-Omni",
  "architectures": ["FoleyOmniDiT"],
  "model_type": "t2a",
  "patch_size": [1],
  "dim": 3072,
  "ffn_dim": 14336,
  "freq_dim": 256,
  "num_heads": 24,
  "num_layers": 30,
  "in_dim": 20,
  "out_dim": 20,
  "text_len": 512,
  "window_size": [-1, -1],
  "qk_norm": true,
  "cross_attn_norm": true,
  "eps": 1e-6,
  "temporal_rope_scaling_factor": 0.19676,
  "sync_drop_from_context": false,
  "sync_add_to_audio": true,
  "sync_add_to_audio_each_block": true,
  "sync_use_adaln": false,
  "sync_use_proj": true,
  "sync_use_adapter": true,
  "sync_adapter_type": "depthwise_conv",
  "sync_adapter_kernel_size": 5,
  "sync_adapter_expansion": 2.0,
  "use_continuous_time_context_rope": false,
  "continuous_time_context_rope_mode": "auto",
  "use_text_context_rope": true,
  "use_clip_context_rope": true,
  "use_sync_context_rope": true,
  "context_rope_theta": 10000.0,
  "context_text_rope_scaling": 1.0,
  "context_clip_rope_scaling": 1.0,
  "context_sync_rope_scaling": 1.0
}