{
  "architectures": [
    "BertRegressor"
  ],
  "base_model": "bert-base-uncased",
  "num_hidden_layers": 3,
  "hidden_size": 768,
  "head": "Linear(768, 1)",
  "task": "regression",
  "output_range": [
    1.0,
    6.0
  ],
  "cefr_mapping": {
    "A1": 1,
    "A2": 2,
    "B1": 3,
    "B2": 4,
    "C1": 5,
    "C2": 6
  },
  "max_length": 128,
  "tokenizer": "bert-base-uncased",
  "training_config": {
    "csv_path": "data/processed/ace_cefr_labeled.csv",
    "output_dir": "checkpoints/reproduce",
    "model_name": "bert-base-uncased",
    "num_layers": 3,
    "max_length": 128,
    "lr": 6e-05,
    "epochs": 12,
    "batch_size": 32,
    "warmup_ratio": 0.1,
    "weight_decay": 0.01,
    "max_grad_norm": 1.0,
    "num_workers": 2,
    "seed": 42
  },
  "test_results": {
    "final_epoch_test_mse": 0.5775573253631592,
    "final_epoch_test_mae": 0.5508898496627808,
    "best_test_mse": 0.5665906071662903,
    "history": [
      {
        "epoch": 1,
        "train_loss": 12.465281147903271,
        "test_mse": 6.588264465332031,
        "test_mae": 2.1838321685791016
      },
      {
        "epoch": 2,
        "train_loss": 2.5425199029150973,
        "test_mse": 1.0636351108551025,
        "test_mae": 0.8281134366989136
      },
      {
        "epoch": 3,
        "train_loss": 0.9577709433737766,
        "test_mse": 1.0986764430999756,
        "test_mae": 0.8498026132583618
      },
      {
        "epoch": 4,
        "train_loss": 0.6925251134995664,
        "test_mse": 0.7558661699295044,
        "test_mae": 0.6341950297355652
      },
      {
        "epoch": 5,
        "train_loss": 0.4300207313526882,
        "test_mse": 0.573773205280304,
        "test_mae": 0.5825716257095337
      },
      {
        "epoch": 6,
        "train_loss": 0.34610338934351886,
        "test_mse": 0.5665906071662903,
        "test_mae": 0.5687209367752075
      },
      {
        "epoch": 7,
        "train_loss": 0.25567558910069843,
        "test_mse": 0.6220540404319763,
        "test_mae": 0.5755833983421326
      },
      {
        "epoch": 8,
        "train_loss": 0.17715133244401954,
        "test_mse": 0.6116251945495605,
        "test_mae": 0.5671263337135315
      },
      {
        "epoch": 9,
        "train_loss": 0.1541851587509841,
        "test_mse": 0.6381506323814392,
        "test_mae": 0.5819261074066162
      },
      {
        "epoch": 10,
        "train_loss": 0.13355727959214972,
        "test_mse": 0.5858347415924072,
        "test_mae": 0.5533825755119324
      },
      {
        "epoch": 11,
        "train_loss": 0.1009212305371681,
        "test_mse": 0.5986077189445496,
        "test_mae": 0.5595420002937317
      },
      {
        "epoch": 12,
        "train_loss": 0.08693857780668172,
        "test_mse": 0.5775573253631592,
        "test_mae": 0.5508898496627808
      }
    ],
    "paper_targets": {
      "bert_baseline": 0.44,
      "bert_with_llm_pretrain": 0.37,
      "human_expert": 0.75
    }
  },
  "selected_state": "best_test_mse_epoch"
}