| { | |
| "model_name": "/gpfs/workdir/aswalda/CodeMixedRedTeaming/models/meta-llama/Meta-Llama-3-8B-Instruct", | |
| "output_dir": "/gpfs/workdir/aswalda/CodeMixedRedTeaming/models/aligned_model_new", | |
| "mode": "both", | |
| "freeze_through": 17, | |
| "align_layers": [ | |
| 18, | |
| 19, | |
| 20, | |
| 21, | |
| 22, | |
| 23, | |
| 24, | |
| 25, | |
| 26, | |
| 27, | |
| 28, | |
| 29, | |
| 30, | |
| 31, | |
| 32 | |
| ], | |
| "alpha": 1.0, | |
| "beta": 1.0, | |
| "temperature": 2.0, | |
| "use_safe": true, | |
| "val_split": 0.1, | |
| "max_length": 512, | |
| "batch_size": 8, | |
| "epochs": 3, | |
| "lr": 1e-05, | |
| "weight_decay": 0.01, | |
| "max_grad_norm": 1.0, | |
| "train_layers": [ | |
| 18, | |
| 19, | |
| 20, | |
| 21, | |
| 22, | |
| 23, | |
| 24, | |
| 25, | |
| 26, | |
| 27, | |
| 28, | |
| 29, | |
| 30, | |
| 31, | |
| 32 | |
| ], | |
| "n_train": 828, | |
| "n_val": 92 | |
| } |