{
  "model": "phi2-mental-health",
  "base_model": "microsoft/phi-2",
  "dataset": "ShenLab/MentalChat16K",
  "lora_config": {
    "rank": 16,
    "alpha": 32,
    "target_modules": [
      "q_proj",
      "k_proj",
      "v_proj",
      "dense"
    ],
    "dropout": 0.1
  },
  "training": {
    "final_train_loss": 0.7486542798042297,
    "total_steps": 2500,
    "epochs": 4,
    "learning_rate": 0.0002,
    "per_device_batch_size": 4,
    "gradient_accumulation": 2
  },
  "evaluation": {
    "eval_loss": 0.7297702431678772,
    "eval_runtime": 4064.1661,
    "eval_samples_per_second": 0.116,
    "eval_steps_per_second": 0.029,
    "epoch": 3.7397157816005984
  },
  "test_eval": {
    "eval_loss": 0.7111775875091553,
    "eval_runtime": 39.2705,
    "eval_samples_per_second": 12.019,
    "eval_steps_per_second": 3.005,
    "epoch": 3.7397157816005984
  },
  "dataset_stats": {
    "train_size": 5347,
    "val_size": 472,
    "test_size": 472
  }
}