registry / registry.json
zkeown's picture
Update registry with all model packages
6302d26 verified
{
"schemaVersion": "1.0.0",
"organization": "schismaudio",
"models": [
{
"expertId": "melroformer-full",
"expertIds": [
"melroformer-full"
],
"name": "MelRoFormer Full",
"repo": "schismaudio/melroformer-full",
"version": "1.0.0",
"tasks": [
"vocalSeparation"
],
"qualityTier": "high",
"estimatedRTF": 0.6,
"peakMemoryMB": 850,
"inputKind": "mix",
"outputKind": "stem",
"description": "Full Mel-Band RoFormer (~72M params) for high-quality vocal separation",
"fileSizeMB": 436
},
{
"expertId": "melroformer-lightweight",
"expertIds": [
"melroformer-lightweight"
],
"name": "MelRoFormer Lightweight",
"repo": "schismaudio/melroformer-lightweight",
"version": "1.0.0",
"tasks": [
"vocalSeparation"
],
"qualityTier": "medium",
"estimatedRTF": 0.3,
"peakMemoryMB": 256,
"inputKind": "mix",
"outputKind": "stem",
"description": "Lightweight Mel-Band RoFormer (~34M params) for fast vocal separation",
"fileSizeMB": 65
},
{
"expertId": "scnet-base",
"expertIds": [
"scnet-base"
],
"name": "SCNet Base",
"repo": "schismaudio/scnet-base",
"version": "1.0.0",
"tasks": [
"stemSeparation",
"vocalSeparation"
],
"qualityTier": "medium",
"estimatedRTF": 0.6,
"peakMemoryMB": 1024,
"inputKind": "mix",
"outputKind": "stems",
"description": "SCNet Base (~10M params) for 4-stem separation",
"outputStems": [
"drums",
"bass",
"other",
"vocals"
],
"fileSizeMB": 44
},
{
"expertId": "scnet-large",
"expertIds": [
"scnet-large"
],
"name": "SCNet Large",
"repo": "schismaudio/scnet-large",
"version": "1.0.0",
"tasks": [
"stemSeparation",
"vocalSeparation"
],
"qualityTier": "high",
"estimatedRTF": 0.8,
"peakMemoryMB": 1600,
"inputKind": "mix",
"outputKind": "stems",
"description": "SCNet Large (~41M params) for higher-quality 4-stem separation",
"outputStems": [
"drums",
"bass",
"other",
"vocals"
],
"fileSizeMB": 165
},
{
"expertId": "apollo",
"expertIds": [
"apollo"
],
"name": "Apollo Enhancement",
"repo": "schismaudio/apollo",
"version": "1.0.0",
"tasks": [
"audioEnhancement"
],
"qualityTier": "high",
"estimatedRTF": 1.6,
"peakMemoryMB": 128,
"inputKind": "any",
"outputKind": "any",
"description": "Apollo audio enhancement model for post-separation cleanup",
"fileSizeMB": 33
},
{
"expertId": "bsroformer-base",
"expertIds": [
"bsroformer-base"
],
"name": "BS-RoFormer Base",
"repo": "schismaudio/bsroformer-base",
"version": "1.0.0",
"tasks": [
"stemSeparation",
"vocalSeparation"
],
"qualityTier": "high",
"estimatedRTF": 1.0,
"peakMemoryMB": 330,
"inputKind": "mix",
"outputKind": "stems",
"description": "Band-Split RoFormer for high-quality 4-stem separation",
"outputStems": [
"drums",
"bass",
"other",
"vocals"
],
"fileSizeMB": 253
},
{
"expertId": "dttnet",
"expertIds": [
"dttnet-vocals",
"dttnet-drums",
"dttnet-bass",
"dttnet-other"
],
"name": "DTTNet (All Stems)",
"repo": "schismaudio/dttnet",
"version": "1.0.0",
"tasks": [
"vocalSeparation",
"stemSeparation"
],
"qualityTier": "high",
"estimatedRTF": 0.4,
"peakMemoryMB": 384,
"inputKind": "mix",
"outputKind": "stem",
"description": "Dual-Path TFC-TDF UNet per-stem models (vocals, drums, bass, other)",
"fileSizeMB": 75
},
{
"expertId": "htdemucs-ft",
"expertIds": [
"htdemucs-ft-vocals",
"htdemucs-ft-drums",
"htdemucs-ft-bass",
"htdemucs-ft-other"
],
"name": "HTDemucs Fine-Tuned (All Stems)",
"repo": "schismaudio/htdemucs-ft",
"version": "1.0.0",
"tasks": [
"vocalSeparation",
"stemSeparation"
],
"qualityTier": "high",
"estimatedRTF": 1.0,
"peakMemoryMB": 250,
"inputKind": "mix",
"outputKind": "stem",
"description": "Hybrid Transformer Demucs fine-tuned per-stem models",
"fileSizeMB": 821
},
{
"expertId": "htdemucs-6s",
"expertIds": [
"htdemucs-6s"
],
"name": "HTDemucs 6-Source",
"repo": "schismaudio/htdemucs-6s",
"version": "1.0.0",
"tasks": [
"stemSeparation"
],
"qualityTier": "medium",
"estimatedRTF": 1.0,
"peakMemoryMB": 500,
"inputKind": "mix",
"outputKind": "stems",
"description": "HTDemucs 6-source model for vocals/drums/bass/other/guitar/piano separation",
"outputStems": [
"drums",
"bass",
"other",
"vocals",
"guitar",
"piano"
],
"fileSizeMB": 146
},
{
"expertId": "banquet",
"expertIds": [
"banquet-vocals",
"banquet-drums",
"banquet-bass",
"banquet-other",
"banquet-guitar",
"banquet-piano",
"banquet-query"
],
"name": "Banquet (Query-Based Separation)",
"repo": "schismaudio/banquet",
"version": "1.0.0",
"tasks": [
"vocalSeparation",
"stemSeparation"
],
"qualityTier": "medium",
"estimatedRTF": 2.5,
"peakMemoryMB": 450,
"inputKind": "mix",
"outputKind": "stem",
"description": "Query-based multi-stem separation with PaSST encoder (6 stems + subcategories)",
"fileSizeMB": 322
},
{
"expertId": "audiosep",
"expertIds": [
"audiosep-base"
],
"name": "AudioSep (Text-Guided Separation)",
"repo": "schismaudio/audiosep",
"version": "1.0.0",
"tasks": [
"textGuidedSeparation"
],
"qualityTier": "medium",
"estimatedRTF": 0.1,
"peakMemoryMB": 600,
"inputKind": "mix",
"outputKind": "stem",
"description": "Text-guided universal sound separation \u2014 describe what to extract in natural language",
"fileSizeMB": 578
},
{
"expertId": "deepfilternet3",
"expertIds": [
"deepfilternet"
],
"name": "DeepFilterNet3 Enhancement",
"repo": "schismaudio/deepfilternet3",
"version": "1.0.0",
"tasks": [
"audioEnhancement"
],
"qualityTier": "medium",
"estimatedRTF": 0.1,
"peakMemoryMB": 50,
"inputKind": "any",
"outputKind": "any",
"description": "DeepFilterNet3 speech enhancement (~2.3M params) \u2014 ERB spectral masking + deep filtering with learned complex FIR filters",
"fileSizeMB": 9
},
{
"expertId": "tfctdfunet",
"expertIds": [
"tfctdfunet-vocals",
"tfctdfunet-drums",
"tfctdfunet-bass",
"tfctdfunet-other"
],
"name": "TFC-TDF-UNet v3 (MDX23)",
"repo": "schismaudio/tfctdfunet",
"version": "1.0.0",
"tasks": [
"vocalSeparation",
"stemSeparation"
],
"qualityTier": "high",
"estimatedRTF": 0.6,
"peakMemoryMB": 350,
"inputKind": "mix",
"outputKind": "stem",
"description": "MDX23 Model-A (TFC-TDF-UNet v3) multi-source separation with subbands",
"fileSizeMB": 115
}
]
}