hypnos / config.json
joncarter's picture
Add config.json (enables Hub download tracking)
a5593e6 verified
{
"model_target": "hypnos.models.rq_transformer.MultiModalRQTransformer",
"model_kwargs": {
"channel_embeddings": true,
"cls_independent_crp": false,
"depth_depth": 4,
"depth_dim": 384,
"depth_heads": 6,
"depth_mlp_ratio": 4.0,
"dropout": 0.1,
"embed_dim": 768,
"global_every_n": 4,
"global_window": 256,
"layer_scale_init": 0.01,
"max_seq_len": 16384,
"mod_context_dropout_p": 0.0,
"modality_attn_every_n": 1,
"modality_attn_start_layer": 0,
"modality_grouping_alpha": 1.0,
"modality_loss_weights": null,
"modality_use_ffn": false,
"qk_norm": true,
"random_subset_masking": false,
"share_trunk_depth_emb": false,
"sliding_window": 64,
"swiglu": true,
"temporal_depth": 12,
"temporal_heads": 12,
"temporal_mlp_ratio": 4.0,
"tie_depth_io": false,
"use_activation_checkpointing": false,
"use_cls": false,
"xsa": false
},
"modalities": [
{
"name": "eeg_c3",
"signal_type": "eeg",
"channels": [
"C3"
],
"tokenizer": "eeg-q8-causal",
"num_quantizers": 8,
"codebook_size": 2048,
"token_duration_sec": 1.0,
"sample_rate": 128,
"preprocess_modality": "eeg"
},
{
"name": "eeg_c4",
"signal_type": "eeg",
"channels": [
"C4"
],
"tokenizer": "eeg-q8-causal",
"num_quantizers": 8,
"codebook_size": 2048,
"token_duration_sec": 1.0,
"sample_rate": 128,
"preprocess_modality": "eeg"
},
{
"name": "ecg",
"signal_type": "ecg",
"channels": [
"ECG"
],
"tokenizer": "ecg-q4-causal",
"num_quantizers": 4,
"codebook_size": 2048,
"token_duration_sec": 1.0,
"sample_rate": 128,
"preprocess_modality": "ecg"
},
{
"name": "resp_abd",
"signal_type": "resp",
"channels": [
"ABD"
],
"tokenizer": "resp-q4-causal",
"num_quantizers": 4,
"codebook_size": 2048,
"token_duration_sec": 1.0,
"sample_rate": 32,
"preprocess_modality": "respiratory"
},
{
"name": "resp_thx",
"signal_type": "resp",
"channels": [
"THX"
],
"tokenizer": "resp-q4-causal",
"num_quantizers": 4,
"codebook_size": 2048,
"token_duration_sec": 1.0,
"sample_rate": 32,
"preprocess_modality": "respiratory"
},
{
"name": "emg_chin",
"signal_type": "emg",
"channels": [
"Chin"
],
"tokenizer": "emg-q8-causal",
"num_quantizers": 8,
"codebook_size": 2048,
"token_duration_sec": 1.0,
"sample_rate": 128,
"preprocess_modality": "emg"
},
{
"name": "eog_e1",
"signal_type": "eog",
"channels": [
"E1"
],
"tokenizer": "eog-q8-causal",
"num_quantizers": 8,
"codebook_size": 2048,
"token_duration_sec": 1.0,
"sample_rate": 128,
"preprocess_modality": "eeg"
},
{
"name": "eog_e2",
"signal_type": "eog",
"channels": [
"E2"
],
"tokenizer": "eog-q8-causal",
"num_quantizers": 8,
"codebook_size": 2048,
"token_duration_sec": 1.0,
"sample_rate": 128,
"preprocess_modality": "eeg"
}
],
"tokenizers": {
"eeg-q8-causal": {
"signal_type": "eeg",
"num_quantizers": 8,
"codebook_size": 2048,
"token_duration_sec": 1.0,
"sample_rate": 128,
"tokenizer_kwargs": {
"activation": "elu",
"attention_depth": 4,
"attention_heads": 8,
"causal": true,
"codebook_dim": 256,
"codebook_size": 2048,
"commitment_cost": 0.25,
"dilation_base": 2,
"ema_decay": 0.99,
"embed_dim": 512,
"in_channels": 1,
"last_kernel_size": 7,
"latent_dim": null,
"layer_scale_init": 0.01,
"mode": "discrete",
"n_filters": 64,
"n_residual_layers": 1,
"norm": "weight",
"num_quantizers": 8,
"pad_mode": "reflect",
"quantization_dropout": 0.5,
"quantizer_dropout": 0.0,
"ratios": [
2,
4,
4,
4
],
"rotation_trick": true,
"sample_rate": 128,
"stride_kernel_multiplier": 2,
"token_duration_sec": 1.0,
"transformer_dim_feedforward": 2048,
"use_activation_checkpointing": false,
"window_size": 32
}
},
"ecg-q4-causal": {
"signal_type": "ecg",
"num_quantizers": 4,
"codebook_size": 2048,
"token_duration_sec": 1.0,
"sample_rate": 128,
"tokenizer_kwargs": {
"activation": "elu",
"attention_depth": 4,
"attention_heads": 8,
"causal": true,
"codebook_dim": 256,
"codebook_size": 2048,
"commitment_cost": 0.25,
"dilation_base": 2,
"ema_decay": 0.99,
"embed_dim": 512,
"in_channels": 1,
"last_kernel_size": 7,
"latent_dim": null,
"layer_scale_init": 0.01,
"mode": "discrete",
"n_filters": 64,
"n_residual_layers": 1,
"norm": "weight",
"num_quantizers": 4,
"pad_mode": "reflect",
"quantization_dropout": 0.5,
"quantizer_dropout": 0.0,
"ratios": [
2,
4,
4,
4
],
"rotation_trick": true,
"sample_rate": 128,
"stride_kernel_multiplier": 2,
"token_duration_sec": 1.0,
"transformer_dim_feedforward": 2048,
"use_activation_checkpointing": false,
"window_size": 32
}
},
"resp-q4-causal": {
"signal_type": "resp",
"num_quantizers": 4,
"codebook_size": 2048,
"token_duration_sec": 1.0,
"sample_rate": 32,
"tokenizer_kwargs": {
"activation": "elu",
"attention_depth": 4,
"attention_heads": 8,
"causal": true,
"codebook_dim": 256,
"codebook_size": 2048,
"commitment_cost": 0.25,
"dilation_base": 2,
"ema_decay": 0.99,
"embed_dim": 512,
"in_channels": 1,
"last_kernel_size": 7,
"latent_dim": null,
"layer_scale_init": 0.01,
"mode": "discrete",
"n_filters": 64,
"n_residual_layers": 1,
"norm": "weight",
"num_quantizers": 4,
"pad_mode": "reflect",
"quantization_dropout": 0.5,
"quantizer_dropout": 0.0,
"ratios": [
4,
4,
2
],
"rotation_trick": true,
"sample_rate": 32,
"stride_kernel_multiplier": 2,
"token_duration_sec": 1.0,
"transformer_dim_feedforward": 2048,
"use_activation_checkpointing": false,
"window_size": 32
}
},
"emg-q8-causal": {
"signal_type": "emg",
"num_quantizers": 8,
"codebook_size": 2048,
"token_duration_sec": 1.0,
"sample_rate": 128,
"tokenizer_kwargs": {
"activation": "elu",
"attention_depth": 4,
"attention_heads": 8,
"causal": true,
"codebook_dim": 256,
"codebook_size": 2048,
"commitment_cost": 0.25,
"dilation_base": 2,
"ema_decay": 0.99,
"embed_dim": 512,
"in_channels": 1,
"last_kernel_size": 7,
"latent_dim": null,
"layer_scale_init": 0.01,
"mode": "discrete",
"n_filters": 64,
"n_residual_layers": 1,
"norm": "weight",
"num_quantizers": 8,
"pad_mode": "reflect",
"quantization_dropout": 0.5,
"quantizer_dropout": 0.0,
"ratios": [
2,
4,
4,
4
],
"rotation_trick": true,
"sample_rate": 128,
"stride_kernel_multiplier": 2,
"token_duration_sec": 1.0,
"transformer_dim_feedforward": 2048,
"use_activation_checkpointing": false,
"window_size": 32
}
},
"eog-q8-causal": {
"signal_type": "eog",
"num_quantizers": 8,
"codebook_size": 2048,
"token_duration_sec": 1.0,
"sample_rate": 128,
"tokenizer_kwargs": {
"activation": "elu",
"attention_depth": 4,
"attention_heads": 8,
"causal": true,
"codebook_dim": 256,
"codebook_size": 2048,
"commitment_cost": 0.25,
"dilation_base": 2,
"ema_decay": 0.99,
"embed_dim": 512,
"in_channels": 1,
"last_kernel_size": 7,
"latent_dim": null,
"layer_scale_init": 0.01,
"mode": "discrete",
"n_filters": 64,
"n_residual_layers": 1,
"norm": "weight",
"num_quantizers": 8,
"pad_mode": "reflect",
"quantization_dropout": 0.5,
"quantizer_dropout": 0.0,
"ratios": [
2,
4,
4,
4
],
"rotation_trick": true,
"sample_rate": 128,
"stride_kernel_multiplier": 2,
"token_duration_sec": 1.0,
"transformer_dim_feedforward": 2048,
"use_activation_checkpointing": false,
"window_size": 32
}
}
}
}