gpad2-task-a / results.json
ranjan56cse's picture
Training complete - Task A
2670884 verified
{
"task": "A",
"train_result": {
"train_runtime": 89.8415,
"train_samples_per_second": 55.654,
"train_steps_per_second": 3.506,
"total_flos": 1429776675840000.0,
"train_loss": 0.30868880862281434,
"epoch": 5.0
},
"eval_result": {
"eval_loss": 0.0931851789355278,
"eval_accuracy": 0.971,
"eval_precision": 0.9110169491525424,
"eval_recall": 0.9641255605381166,
"eval_specificity": 0.972972972972973,
"eval_f1": 0.9368191721132898,
"eval_auc": 0.9902955485915127,
"eval_pr_auc": 0.9779863735053174,
"eval_mcc": 0.9186403523498589,
"eval_balanced_accuracy": 0.9685492667555449,
"eval_runtime": 3.9437,
"eval_samples_per_second": 253.57,
"eval_steps_per_second": 8.114,
"epoch": 5.0
},
"config": {
"task": "A",
"base_model": "microsoft/codebert-base",
"num_labels": 2,
"stylometric_dim": 32,
"num_gpad_layers": 1,
"entropy_alpha": 0.1,
"max_length": 512,
"use_stylometric": true,
"num_epochs": 5,
"train_batch_size": 16,
"eval_batch_size": 32,
"learning_rate": 2e-05,
"weight_decay": 0.01,
"warmup_ratio": 0.1,
"max_grad_norm": 1.0,
"gradient_accumulation_steps": 1,
"use_mixed_precision": true,
"use_gradient_checkpointing": true,
"val_split": 0.2,
"sample_size": null,
"output_dir": "./gpad2_results_taskA_taska",
"log_interval": 100,
"save_strategy": "steps",
"save_steps": 500,
"eval_strategy": "steps",
"eval_steps": 500,
"early_stopping_patience": 3,
"seed": 42,
"use_wandb": false,
"wandb_project": "gpad2_taska",
"wandb_run_name": null,
"push_to_hub": true,
"hub_model_id": "ranjan56cse/gpad2-taska_smpl",
"hub_token": null,
"hub_private_repo": false
}
}