{ "task": "A", "train_result": { "train_runtime": 89.8415, "train_samples_per_second": 55.654, "train_steps_per_second": 3.506, "total_flos": 1429776675840000.0, "train_loss": 0.30868880862281434, "epoch": 5.0 }, "eval_result": { "eval_loss": 0.0931851789355278, "eval_accuracy": 0.971, "eval_precision": 0.9110169491525424, "eval_recall": 0.9641255605381166, "eval_specificity": 0.972972972972973, "eval_f1": 0.9368191721132898, "eval_auc": 0.9902955485915127, "eval_pr_auc": 0.9779863735053174, "eval_mcc": 0.9186403523498589, "eval_balanced_accuracy": 0.9685492667555449, "eval_runtime": 3.9437, "eval_samples_per_second": 253.57, "eval_steps_per_second": 8.114, "epoch": 5.0 }, "config": { "task": "A", "base_model": "microsoft/codebert-base", "num_labels": 2, "stylometric_dim": 32, "num_gpad_layers": 1, "entropy_alpha": 0.1, "max_length": 512, "use_stylometric": true, "num_epochs": 5, "train_batch_size": 16, "eval_batch_size": 32, "learning_rate": 2e-05, "weight_decay": 0.01, "warmup_ratio": 0.1, "max_grad_norm": 1.0, "gradient_accumulation_steps": 1, "use_mixed_precision": true, "use_gradient_checkpointing": true, "val_split": 0.2, "sample_size": null, "output_dir": "./gpad2_results_taskA_taska", "log_interval": 100, "save_strategy": "steps", "save_steps": 500, "eval_strategy": "steps", "eval_steps": 500, "early_stopping_patience": 3, "seed": 42, "use_wandb": false, "wandb_project": "gpad2_taska", "wandb_run_name": null, "push_to_hub": true, "hub_model_id": "ranjan56cse/gpad2-taska_smpl", "hub_token": null, "hub_private_repo": false } }