{
  "model_type": "transformer",
  "architectures": ["TransformerLanguageModel"],
  "vocab_size": 65,
  "d_model": 256,
  "nhead": 8,
  "num_layers": 6,
  "dropout": 0.2,
  "seq_length": 128,
  "dim_feedforward": 1024,
  "tokenizer_type": "character-level",
  "task": "text-generation",
  "language": "en",
  "dataset": "shakespeare",
  "training_epochs": 25,
  "training_loss": 0.937,
  "validation_loss": 0.629,
  "validation_accuracy": 0.799,
  "perplexity": 1.9,
  "framework": "pytorch",
  "license": "mit"
}