{
  "segment_len50": {
    "filename": "checkpoints/segment_len50.ckpt",
    "class": "SegmentTokenDiscriminator",
    "segment_len": 50,
    "vocab_size": 65536,
    "d_model": 256,
    "nhead": 8,
    "num_layers": 4,
    "dim_feedforward": 1024,
    "dropout": 0.1
  },
  "strided_seg50_scale10": {
    "filename": "checkpoints/strided_seg50_scale10.ckpt",
    "class": "StridedSegmentTokenDiscriminator",
    "segment_len": 50,
    "scale": 10,
    "vocab_size": 65536,
    "d_model": 256,
    "nhead": 8,
    "num_layers": 4,
    "dim_feedforward": 1024,
    "dropout": 0.1
  },
  "strided_seg50_scale25": {
    "filename": "checkpoints/strided_seg50_scale25.ckpt",
    "class": "StridedSegmentTokenDiscriminator",
    "segment_len": 50,
    "scale": 25,
    "vocab_size": 65536,
    "d_model": 256,
    "nhead": 8,
    "num_layers": 4,
    "dim_feedforward": 1024,
    "dropout": 0.1
  },
  "segment_len25": {
    "filename": "checkpoints/segment_len25.ckpt",
    "class": "SegmentTokenDiscriminator",
    "segment_len": 25,
    "vocab_size": 65536,
    "d_model": 256,
    "nhead": 8,
    "num_layers": 4,
    "dim_feedforward": 1024,
    "dropout": 0.1
  },
  "segment_len10": {
    "filename": "checkpoints/segment_len10.ckpt",
    "class": "SegmentTokenDiscriminator",
    "segment_len": 10,
    "vocab_size": 65536,
    "d_model": 256,
    "nhead": 8,
    "num_layers": 4,
    "dim_feedforward": 1024,
    "dropout": 0.1
  }
}