{ "_name_": "SequenceClassifier", "_model_version_": "1.0.0", "_symupe_version_": "1.1.0", "backbone": { "dim": 768, "token_embeddings": { "_target_": "simple", "emb_dims": 128, "mode": "cat", "emb_norm": true, "discrete": false, "sinusoidal": true, "sinusoidal_learned": true, "project_bias": false, "embedding_kwargs": { "depth": 0, "log_inv_freq": true, "with_positions": false }, "tie_keys": null, "special_tokens": { "PAD_None": 0, "MASK_None": 1, "BOS_None": 2, "EOS_None": 3, "IGNORE_None": 4, "EOD_None": 5, "Bar_Line": 6, "Pedal_On": 7, "Pedal_Off": 8 } }, "emb_norm": false, "emb_dropout": 0.0, "use_abs_pos_emb": false, "project_bias": false, "transformer": { "_target_": "encoder", "depth": 12, "memory_tokens": 4, "final_norm_bias": false, "attention": { "_target_": "global", "heads": 12, "head_dim": 64, "one_kv_head": true, "dropout": 0.05, "rotary_pos_emb": true, "rotary_emb_base": 1024, "alibi_pos_bias": false, "alibi_learned": true, "alibi_heads": 8 }, "feed_forward": { "mult": 3, "glu": true, "swish": true, "dropout": 0.05 } }, "lm_head": null, "num_tokens": { "Pitch": 97, "TimeShift": 595, "Velocity": 42, "TimeDurationSustain": 560, "TimePosition": 2409 } }, "backbone_checkpoint": null, "transformer": { "dim": 128, "depth": 1, "final_norm_bias": false, "attention": { "_target_": "global", "heads": 2, "head_dim": 64, "one_kv_head": true, "dropout": 0.2 }, "feed_forward": { "mult": 1, "glu": false, "swish": true, "dropout": 0.2 } }, "classifier": { "hidden_dims": null }, "aggregation": "token", "emb_norm": false, "emb_dropout": 0.3, "clf_dropout": 0.3, "context_with_memory": true, "backbone_output_layer": 10, "num_classes": 4, "note_classifier": false, "label_smoothing": 0.0, "detach_inputs": true, "memory_norm": false, "labels": { "0": "score", "1": "high quality", "2": "low quality", "3": "corrupted" } }