{
  "model_type": "isrm-vae",
  "architecture": "distilbert-vae",
  "architecture_type": "dual-layer",
  "base_model": "distilbert-base-uncased",
  "latent_dim": 3,
  "hidden_dim": 768,
  "num_layers": 6,
  "num_unfrozen_layers": 2,
  "pad_dimensions": [
    "pleasure",
    "arousal",
    "dominance"
  ],
  "bdi_dimensions": [
    "belief",
    "goal",
    "intention",
    "ambiguity",
    "social"
  ],
  "pad_layer": 10,
  "bdi_layer": 19,
  "task": "affective-state-encoding",
  "training": {
    "dataset_size": 1500,
    "epochs": 15,
    "optimizer": "AdamW",
    "learning_rate": 2e-05,
    "loss_fn": "MSE + KL divergence",
    "kl_weight": 0.001,
    "final_mse": 0.018,
    "final_kld": 0.003
  }
}