gpad2-task-b / results.json
ranjan56cse's picture
Training complete - Task B
fa8f459 verified
{
"task": "B",
"train_result": {
"train_runtime": 63.5451,
"train_samples_per_second": 54.922,
"train_steps_per_second": 3.462,
"total_flos": 998021268971520.0,
"train_loss": 1.1348177476362749,
"epoch": 5.0
},
"eval_result": {
"eval_loss": 0.8116088509559631,
"eval_accuracy": 0.7535816618911175,
"eval_precision": 0.6650326670418545,
"eval_recall": 0.7535816618911175,
"eval_specificity": null,
"eval_f1": 0.6942659022778552,
"eval_auc": null,
"eval_pr_auc": null,
"eval_mcc": 0.4826800602055998,
"eval_balanced_accuracy": 0.20106890227872526,
"eval_runtime": 2.8095,
"eval_samples_per_second": 248.44,
"eval_steps_per_second": 7.83,
"epoch": 5.0
},
"config": {
"task": "B",
"base_model": "microsoft/codebert-base",
"num_labels": 11,
"stylometric_dim": 32,
"num_gpad_layers": 1,
"entropy_alpha": 0.1,
"max_length": 512,
"use_stylometric": true,
"num_epochs": 5,
"train_batch_size": 16,
"eval_batch_size": 32,
"learning_rate": 2e-05,
"weight_decay": 0.01,
"warmup_ratio": 0.1,
"max_grad_norm": 1.0,
"gradient_accumulation_steps": 1,
"use_mixed_precision": true,
"use_gradient_checkpointing": true,
"val_split": 0.2,
"sample_size": null,
"output_dir": "./gpad2_results_taskB_taskb",
"log_interval": 100,
"save_strategy": "steps",
"save_steps": 500,
"eval_strategy": "steps",
"eval_steps": 500,
"early_stopping_patience": 3,
"seed": 42,
"use_wandb": false,
"wandb_project": "gpad2_taskb",
"wandb_run_name": null,
"push_to_hub": true,
"hub_model_id": "ranjan56cse/gpad2-taskb_smpl",
"hub_token": null,
"hub_private_repo": false
}
}