| { | |
| "epochs": 20, | |
| "batch_size": 8, | |
| "learning_rate": 1e-05, | |
| "base_dir": "/shared/nas2/ph16/toxic/outputs/classifier", | |
| "data_dir": "/shared/nas2/ph16/toxic/outputs/states/Ministral-8B-Instruct-2410", | |
| "job_name": "Ministral-8B-Instruct-2410_both/layer36", | |
| "ckpt": "", | |
| "gpu": "", | |
| "wandb": false, | |
| "overwrite": true, | |
| "hidden_sizes": [ | |
| "64" | |
| ], | |
| "random_seed": 42, | |
| "token_rule": "last", | |
| "label": "both", | |
| "n_decode": 0, | |
| "layer_id": 36, | |
| "num_classification": 2, | |
| "neg_weight": 1.0, | |
| "llm": "Ministral-8B-Instruct-2410" | |
| } |