{ "model_target": "hypnos.models.rq_transformer.MultiModalRQTransformer", "model_kwargs": { "channel_embeddings": true, "cls_independent_crp": false, "depth_depth": 4, "depth_dim": 384, "depth_heads": 6, "depth_mlp_ratio": 4.0, "dropout": 0.1, "embed_dim": 768, "global_every_n": 4, "global_window": 256, "layer_scale_init": 0.01, "max_seq_len": 16384, "mod_context_dropout_p": 0.0, "modality_attn_every_n": 1, "modality_attn_start_layer": 0, "modality_grouping_alpha": 1.0, "modality_loss_weights": null, "modality_use_ffn": false, "qk_norm": true, "random_subset_masking": false, "share_trunk_depth_emb": false, "sliding_window": 64, "swiglu": true, "temporal_depth": 12, "temporal_heads": 12, "temporal_mlp_ratio": 4.0, "tie_depth_io": false, "use_activation_checkpointing": false, "use_cls": false, "xsa": false }, "modalities": [ { "name": "eeg_c3", "signal_type": "eeg", "channels": [ "C3" ], "tokenizer": "eeg-q8-causal", "num_quantizers": 8, "codebook_size": 2048, "token_duration_sec": 1.0, "sample_rate": 128, "preprocess_modality": "eeg" }, { "name": "eeg_c4", "signal_type": "eeg", "channels": [ "C4" ], "tokenizer": "eeg-q8-causal", "num_quantizers": 8, "codebook_size": 2048, "token_duration_sec": 1.0, "sample_rate": 128, "preprocess_modality": "eeg" }, { "name": "ecg", "signal_type": "ecg", "channels": [ "ECG" ], "tokenizer": "ecg-q4-causal", "num_quantizers": 4, "codebook_size": 2048, "token_duration_sec": 1.0, "sample_rate": 128, "preprocess_modality": "ecg" }, { "name": "resp_abd", "signal_type": "resp", "channels": [ "ABD" ], "tokenizer": "resp-q4-causal", "num_quantizers": 4, "codebook_size": 2048, "token_duration_sec": 1.0, "sample_rate": 32, "preprocess_modality": "respiratory" }, { "name": "resp_thx", "signal_type": "resp", "channels": [ "THX" ], "tokenizer": "resp-q4-causal", "num_quantizers": 4, "codebook_size": 2048, "token_duration_sec": 1.0, "sample_rate": 32, "preprocess_modality": "respiratory" }, { "name": "emg_chin", "signal_type": "emg", "channels": [ "Chin" ], "tokenizer": "emg-q8-causal", "num_quantizers": 8, "codebook_size": 2048, "token_duration_sec": 1.0, "sample_rate": 128, "preprocess_modality": "emg" }, { "name": "eog_e1", "signal_type": "eog", "channels": [ "E1" ], "tokenizer": "eog-q8-causal", "num_quantizers": 8, "codebook_size": 2048, "token_duration_sec": 1.0, "sample_rate": 128, "preprocess_modality": "eeg" }, { "name": "eog_e2", "signal_type": "eog", "channels": [ "E2" ], "tokenizer": "eog-q8-causal", "num_quantizers": 8, "codebook_size": 2048, "token_duration_sec": 1.0, "sample_rate": 128, "preprocess_modality": "eeg" } ], "tokenizers": { "eeg-q8-causal": { "signal_type": "eeg", "num_quantizers": 8, "codebook_size": 2048, "token_duration_sec": 1.0, "sample_rate": 128, "tokenizer_kwargs": { "activation": "elu", "attention_depth": 4, "attention_heads": 8, "causal": true, "codebook_dim": 256, "codebook_size": 2048, "commitment_cost": 0.25, "dilation_base": 2, "ema_decay": 0.99, "embed_dim": 512, "in_channels": 1, "last_kernel_size": 7, "latent_dim": null, "layer_scale_init": 0.01, "mode": "discrete", "n_filters": 64, "n_residual_layers": 1, "norm": "weight", "num_quantizers": 8, "pad_mode": "reflect", "quantization_dropout": 0.5, "quantizer_dropout": 0.0, "ratios": [ 2, 4, 4, 4 ], "rotation_trick": true, "sample_rate": 128, "stride_kernel_multiplier": 2, "token_duration_sec": 1.0, "transformer_dim_feedforward": 2048, "use_activation_checkpointing": false, "window_size": 32 } }, "ecg-q4-causal": { "signal_type": "ecg", "num_quantizers": 4, "codebook_size": 2048, "token_duration_sec": 1.0, "sample_rate": 128, "tokenizer_kwargs": { "activation": "elu", "attention_depth": 4, "attention_heads": 8, "causal": true, "codebook_dim": 256, "codebook_size": 2048, "commitment_cost": 0.25, "dilation_base": 2, "ema_decay": 0.99, "embed_dim": 512, "in_channels": 1, "last_kernel_size": 7, "latent_dim": null, "layer_scale_init": 0.01, "mode": "discrete", "n_filters": 64, "n_residual_layers": 1, "norm": "weight", "num_quantizers": 4, "pad_mode": "reflect", "quantization_dropout": 0.5, "quantizer_dropout": 0.0, "ratios": [ 2, 4, 4, 4 ], "rotation_trick": true, "sample_rate": 128, "stride_kernel_multiplier": 2, "token_duration_sec": 1.0, "transformer_dim_feedforward": 2048, "use_activation_checkpointing": false, "window_size": 32 } }, "resp-q4-causal": { "signal_type": "resp", "num_quantizers": 4, "codebook_size": 2048, "token_duration_sec": 1.0, "sample_rate": 32, "tokenizer_kwargs": { "activation": "elu", "attention_depth": 4, "attention_heads": 8, "causal": true, "codebook_dim": 256, "codebook_size": 2048, "commitment_cost": 0.25, "dilation_base": 2, "ema_decay": 0.99, "embed_dim": 512, "in_channels": 1, "last_kernel_size": 7, "latent_dim": null, "layer_scale_init": 0.01, "mode": "discrete", "n_filters": 64, "n_residual_layers": 1, "norm": "weight", "num_quantizers": 4, "pad_mode": "reflect", "quantization_dropout": 0.5, "quantizer_dropout": 0.0, "ratios": [ 4, 4, 2 ], "rotation_trick": true, "sample_rate": 32, "stride_kernel_multiplier": 2, "token_duration_sec": 1.0, "transformer_dim_feedforward": 2048, "use_activation_checkpointing": false, "window_size": 32 } }, "emg-q8-causal": { "signal_type": "emg", "num_quantizers": 8, "codebook_size": 2048, "token_duration_sec": 1.0, "sample_rate": 128, "tokenizer_kwargs": { "activation": "elu", "attention_depth": 4, "attention_heads": 8, "causal": true, "codebook_dim": 256, "codebook_size": 2048, "commitment_cost": 0.25, "dilation_base": 2, "ema_decay": 0.99, "embed_dim": 512, "in_channels": 1, "last_kernel_size": 7, "latent_dim": null, "layer_scale_init": 0.01, "mode": "discrete", "n_filters": 64, "n_residual_layers": 1, "norm": "weight", "num_quantizers": 8, "pad_mode": "reflect", "quantization_dropout": 0.5, "quantizer_dropout": 0.0, "ratios": [ 2, 4, 4, 4 ], "rotation_trick": true, "sample_rate": 128, "stride_kernel_multiplier": 2, "token_duration_sec": 1.0, "transformer_dim_feedforward": 2048, "use_activation_checkpointing": false, "window_size": 32 } }, "eog-q8-causal": { "signal_type": "eog", "num_quantizers": 8, "codebook_size": 2048, "token_duration_sec": 1.0, "sample_rate": 128, "tokenizer_kwargs": { "activation": "elu", "attention_depth": 4, "attention_heads": 8, "causal": true, "codebook_dim": 256, "codebook_size": 2048, "commitment_cost": 0.25, "dilation_base": 2, "ema_decay": 0.99, "embed_dim": 512, "in_channels": 1, "last_kernel_size": 7, "latent_dim": null, "layer_scale_init": 0.01, "mode": "discrete", "n_filters": 64, "n_residual_layers": 1, "norm": "weight", "num_quantizers": 8, "pad_mode": "reflect", "quantization_dropout": 0.5, "quantizer_dropout": 0.0, "ratios": [ 2, 4, 4, 4 ], "rotation_trick": true, "sample_rate": 128, "stride_kernel_multiplier": 2, "token_duration_sec": 1.0, "transformer_dim_feedforward": 2048, "use_activation_checkpointing": false, "window_size": 32 } } } }