dfm_model / checkpoint-1120 /trainer_state.json
vm24's picture
Upload folder using huggingface_hub
3baafd5 verified
{
"best_metric": 0.35881221294403076,
"best_model_checkpoint": "deepfake_vs_real_image_detection/checkpoint-1120",
"epoch": 70.0,
"eval_steps": 500,
"global_step": 1120,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.6946107784431138,
"eval_loss": 1.4309433698654175,
"eval_runtime": 4.3566,
"eval_samples_per_second": 76.666,
"eval_steps_per_second": 9.641,
"step": 16
},
{
"epoch": 2.0,
"eval_accuracy": 0.7035928143712575,
"eval_loss": 1.3571979999542236,
"eval_runtime": 4.4448,
"eval_samples_per_second": 75.144,
"eval_steps_per_second": 9.449,
"step": 32
},
{
"epoch": 3.0,
"eval_accuracy": 0.7095808383233533,
"eval_loss": 1.2381948232650757,
"eval_runtime": 4.5106,
"eval_samples_per_second": 74.048,
"eval_steps_per_second": 9.311,
"step": 48
},
{
"epoch": 4.0,
"eval_accuracy": 0.7485029940119761,
"eval_loss": 1.1571621894836426,
"eval_runtime": 4.3237,
"eval_samples_per_second": 77.249,
"eval_steps_per_second": 9.714,
"step": 64
},
{
"epoch": 5.0,
"eval_accuracy": 0.7544910179640718,
"eval_loss": 1.1075578927993774,
"eval_runtime": 4.3443,
"eval_samples_per_second": 76.883,
"eval_steps_per_second": 9.668,
"step": 80
},
{
"epoch": 6.0,
"eval_accuracy": 0.7544910179640718,
"eval_loss": 1.0685527324676514,
"eval_runtime": 4.4445,
"eval_samples_per_second": 75.149,
"eval_steps_per_second": 9.45,
"step": 96
},
{
"epoch": 7.0,
"eval_accuracy": 0.7574850299401198,
"eval_loss": 1.0224419832229614,
"eval_runtime": 4.3333,
"eval_samples_per_second": 77.078,
"eval_steps_per_second": 9.692,
"step": 112
},
{
"epoch": 8.0,
"eval_accuracy": 0.7604790419161677,
"eval_loss": 0.9735947847366333,
"eval_runtime": 4.4514,
"eval_samples_per_second": 75.033,
"eval_steps_per_second": 9.435,
"step": 128
},
{
"epoch": 9.0,
"eval_accuracy": 0.7634730538922155,
"eval_loss": 0.935190737247467,
"eval_runtime": 4.483,
"eval_samples_per_second": 74.504,
"eval_steps_per_second": 9.369,
"step": 144
},
{
"epoch": 10.0,
"eval_accuracy": 0.7574850299401198,
"eval_loss": 0.8989432454109192,
"eval_runtime": 4.3947,
"eval_samples_per_second": 76.0,
"eval_steps_per_second": 9.557,
"step": 160
},
{
"epoch": 11.0,
"eval_accuracy": 0.7514970059880239,
"eval_loss": 0.8565046787261963,
"eval_runtime": 4.4679,
"eval_samples_per_second": 74.755,
"eval_steps_per_second": 9.4,
"step": 176
},
{
"epoch": 12.0,
"eval_accuracy": 0.7634730538922155,
"eval_loss": 0.8191085457801819,
"eval_runtime": 4.4986,
"eval_samples_per_second": 74.245,
"eval_steps_per_second": 9.336,
"step": 192
},
{
"epoch": 13.0,
"eval_accuracy": 0.7634730538922155,
"eval_loss": 0.783191442489624,
"eval_runtime": 4.5843,
"eval_samples_per_second": 72.857,
"eval_steps_per_second": 9.162,
"step": 208
},
{
"epoch": 14.0,
"eval_accuracy": 0.7724550898203593,
"eval_loss": 0.7542709708213806,
"eval_runtime": 4.417,
"eval_samples_per_second": 75.617,
"eval_steps_per_second": 9.509,
"step": 224
},
{
"epoch": 15.0,
"eval_accuracy": 0.7694610778443114,
"eval_loss": 0.7199692130088806,
"eval_runtime": 4.401,
"eval_samples_per_second": 75.891,
"eval_steps_per_second": 9.543,
"step": 240
},
{
"epoch": 16.0,
"eval_accuracy": 0.7754491017964071,
"eval_loss": 0.6858012676239014,
"eval_runtime": 4.4254,
"eval_samples_per_second": 75.474,
"eval_steps_per_second": 9.491,
"step": 256
},
{
"epoch": 17.0,
"eval_accuracy": 0.7784431137724551,
"eval_loss": 0.6566184759140015,
"eval_runtime": 4.4216,
"eval_samples_per_second": 75.539,
"eval_steps_per_second": 9.499,
"step": 272
},
{
"epoch": 18.0,
"eval_accuracy": 0.7844311377245509,
"eval_loss": 0.628990650177002,
"eval_runtime": 4.4307,
"eval_samples_per_second": 75.383,
"eval_steps_per_second": 9.479,
"step": 288
},
{
"epoch": 19.0,
"eval_accuracy": 0.7844311377245509,
"eval_loss": 0.6014779210090637,
"eval_runtime": 4.3612,
"eval_samples_per_second": 76.584,
"eval_steps_per_second": 9.63,
"step": 304
},
{
"epoch": 20.0,
"eval_accuracy": 0.7904191616766467,
"eval_loss": 0.5828869938850403,
"eval_runtime": 4.3656,
"eval_samples_per_second": 76.508,
"eval_steps_per_second": 9.621,
"step": 320
},
{
"epoch": 21.0,
"eval_accuracy": 0.7904191616766467,
"eval_loss": 0.560990571975708,
"eval_runtime": 4.4037,
"eval_samples_per_second": 75.846,
"eval_steps_per_second": 9.538,
"step": 336
},
{
"epoch": 22.0,
"eval_accuracy": 0.7904191616766467,
"eval_loss": 0.5444124937057495,
"eval_runtime": 4.4206,
"eval_samples_per_second": 75.556,
"eval_steps_per_second": 9.501,
"step": 352
},
{
"epoch": 23.0,
"eval_accuracy": 0.7964071856287425,
"eval_loss": 0.5321463346481323,
"eval_runtime": 4.402,
"eval_samples_per_second": 75.875,
"eval_steps_per_second": 9.541,
"step": 368
},
{
"epoch": 24.0,
"eval_accuracy": 0.8023952095808383,
"eval_loss": 0.521594226360321,
"eval_runtime": 4.4337,
"eval_samples_per_second": 75.331,
"eval_steps_per_second": 9.473,
"step": 384
},
{
"epoch": 25.0,
"eval_accuracy": 0.8053892215568862,
"eval_loss": 0.5053771138191223,
"eval_runtime": 4.4563,
"eval_samples_per_second": 74.95,
"eval_steps_per_second": 9.425,
"step": 400
},
{
"epoch": 26.0,
"eval_accuracy": 0.8143712574850299,
"eval_loss": 0.4930258095264435,
"eval_runtime": 4.3955,
"eval_samples_per_second": 75.986,
"eval_steps_per_second": 9.555,
"step": 416
},
{
"epoch": 27.0,
"eval_accuracy": 0.811377245508982,
"eval_loss": 0.4849102795124054,
"eval_runtime": 4.4566,
"eval_samples_per_second": 74.945,
"eval_steps_per_second": 9.424,
"step": 432
},
{
"epoch": 28.0,
"eval_accuracy": 0.811377245508982,
"eval_loss": 0.47692808508872986,
"eval_runtime": 4.4557,
"eval_samples_per_second": 74.959,
"eval_steps_per_second": 9.426,
"step": 448
},
{
"epoch": 29.0,
"eval_accuracy": 0.8293413173652695,
"eval_loss": 0.46685636043548584,
"eval_runtime": 4.3405,
"eval_samples_per_second": 76.949,
"eval_steps_per_second": 9.676,
"step": 464
},
{
"epoch": 30.0,
"eval_accuracy": 0.8323353293413174,
"eval_loss": 0.45782506465911865,
"eval_runtime": 4.3468,
"eval_samples_per_second": 76.838,
"eval_steps_per_second": 9.662,
"step": 480
},
{
"epoch": 31.0,
"eval_accuracy": 0.8323353293413174,
"eval_loss": 0.44891008734703064,
"eval_runtime": 4.5111,
"eval_samples_per_second": 74.039,
"eval_steps_per_second": 9.31,
"step": 496
},
{
"epoch": 31.25,
"grad_norm": 3.9690632820129395,
"learning_rate": 8.098055790363483e-07,
"loss": 0.6987,
"step": 500
},
{
"epoch": 32.0,
"eval_accuracy": 0.8323353293413174,
"eval_loss": 0.4414936900138855,
"eval_runtime": 4.3863,
"eval_samples_per_second": 76.146,
"eval_steps_per_second": 9.575,
"step": 512
},
{
"epoch": 33.0,
"eval_accuracy": 0.8323353293413174,
"eval_loss": 0.435556560754776,
"eval_runtime": 4.3922,
"eval_samples_per_second": 76.043,
"eval_steps_per_second": 9.562,
"step": 528
},
{
"epoch": 34.0,
"eval_accuracy": 0.8323353293413174,
"eval_loss": 0.4296257793903351,
"eval_runtime": 4.3498,
"eval_samples_per_second": 76.785,
"eval_steps_per_second": 9.656,
"step": 544
},
{
"epoch": 35.0,
"eval_accuracy": 0.8323353293413174,
"eval_loss": 0.4240988492965698,
"eval_runtime": 4.3863,
"eval_samples_per_second": 76.146,
"eval_steps_per_second": 9.575,
"step": 560
},
{
"epoch": 36.0,
"eval_accuracy": 0.8353293413173652,
"eval_loss": 0.41868290305137634,
"eval_runtime": 4.4309,
"eval_samples_per_second": 75.38,
"eval_steps_per_second": 9.479,
"step": 576
},
{
"epoch": 37.0,
"eval_accuracy": 0.8383233532934131,
"eval_loss": 0.413825124502182,
"eval_runtime": 4.3459,
"eval_samples_per_second": 76.853,
"eval_steps_per_second": 9.664,
"step": 592
},
{
"epoch": 38.0,
"eval_accuracy": 0.8413173652694611,
"eval_loss": 0.4092709720134735,
"eval_runtime": 4.353,
"eval_samples_per_second": 76.728,
"eval_steps_per_second": 9.648,
"step": 608
},
{
"epoch": 39.0,
"eval_accuracy": 0.8413173652694611,
"eval_loss": 0.40586671233177185,
"eval_runtime": 4.3701,
"eval_samples_per_second": 76.429,
"eval_steps_per_second": 9.611,
"step": 624
},
{
"epoch": 40.0,
"eval_accuracy": 0.8502994011976048,
"eval_loss": 0.401659220457077,
"eval_runtime": 4.4026,
"eval_samples_per_second": 75.864,
"eval_steps_per_second": 9.54,
"step": 640
},
{
"epoch": 41.0,
"eval_accuracy": 0.8502994011976048,
"eval_loss": 0.3979702293872833,
"eval_runtime": 4.5672,
"eval_samples_per_second": 73.13,
"eval_steps_per_second": 9.196,
"step": 656
},
{
"epoch": 42.0,
"eval_accuracy": 0.8502994011976048,
"eval_loss": 0.3946226239204407,
"eval_runtime": 4.3743,
"eval_samples_per_second": 76.354,
"eval_steps_per_second": 9.601,
"step": 672
},
{
"epoch": 43.0,
"eval_accuracy": 0.8473053892215568,
"eval_loss": 0.39317673444747925,
"eval_runtime": 4.3247,
"eval_samples_per_second": 77.23,
"eval_steps_per_second": 9.712,
"step": 688
},
{
"epoch": 44.0,
"eval_accuracy": 0.8473053892215568,
"eval_loss": 0.389418363571167,
"eval_runtime": 4.4405,
"eval_samples_per_second": 75.216,
"eval_steps_per_second": 9.458,
"step": 704
},
{
"epoch": 45.0,
"eval_accuracy": 0.8473053892215568,
"eval_loss": 0.3862323462963104,
"eval_runtime": 4.3815,
"eval_samples_per_second": 76.23,
"eval_steps_per_second": 9.586,
"step": 720
},
{
"epoch": 46.0,
"eval_accuracy": 0.8502994011976048,
"eval_loss": 0.384316086769104,
"eval_runtime": 4.4286,
"eval_samples_per_second": 75.42,
"eval_steps_per_second": 9.484,
"step": 736
},
{
"epoch": 47.0,
"eval_accuracy": 0.844311377245509,
"eval_loss": 0.383512943983078,
"eval_runtime": 4.4251,
"eval_samples_per_second": 75.479,
"eval_steps_per_second": 9.491,
"step": 752
},
{
"epoch": 48.0,
"eval_accuracy": 0.8622754491017964,
"eval_loss": 0.3795510232448578,
"eval_runtime": 4.4626,
"eval_samples_per_second": 74.844,
"eval_steps_per_second": 9.412,
"step": 768
},
{
"epoch": 49.0,
"eval_accuracy": 0.8592814371257484,
"eval_loss": 0.3759188950061798,
"eval_runtime": 4.3421,
"eval_samples_per_second": 76.921,
"eval_steps_per_second": 9.673,
"step": 784
},
{
"epoch": 50.0,
"eval_accuracy": 0.8652694610778443,
"eval_loss": 0.37549516558647156,
"eval_runtime": 4.4076,
"eval_samples_per_second": 75.778,
"eval_steps_per_second": 9.529,
"step": 800
},
{
"epoch": 51.0,
"eval_accuracy": 0.8622754491017964,
"eval_loss": 0.3745565414428711,
"eval_runtime": 4.466,
"eval_samples_per_second": 74.787,
"eval_steps_per_second": 9.404,
"step": 816
},
{
"epoch": 52.0,
"eval_accuracy": 0.8652694610778443,
"eval_loss": 0.37246376276016235,
"eval_runtime": 4.3519,
"eval_samples_per_second": 76.748,
"eval_steps_per_second": 9.651,
"step": 832
},
{
"epoch": 53.0,
"eval_accuracy": 0.8652694610778443,
"eval_loss": 0.36974743008613586,
"eval_runtime": 4.4116,
"eval_samples_per_second": 75.709,
"eval_steps_per_second": 9.52,
"step": 848
},
{
"epoch": 54.0,
"eval_accuracy": 0.874251497005988,
"eval_loss": 0.3688933253288269,
"eval_runtime": 4.373,
"eval_samples_per_second": 76.377,
"eval_steps_per_second": 9.604,
"step": 864
},
{
"epoch": 55.0,
"eval_accuracy": 0.874251497005988,
"eval_loss": 0.3665659427642822,
"eval_runtime": 4.3847,
"eval_samples_per_second": 76.173,
"eval_steps_per_second": 9.579,
"step": 880
},
{
"epoch": 56.0,
"eval_accuracy": 0.874251497005988,
"eval_loss": 0.3666609227657318,
"eval_runtime": 4.4937,
"eval_samples_per_second": 74.326,
"eval_steps_per_second": 9.346,
"step": 896
},
{
"epoch": 57.0,
"eval_accuracy": 0.8802395209580839,
"eval_loss": 0.366781622171402,
"eval_runtime": 4.4056,
"eval_samples_per_second": 75.812,
"eval_steps_per_second": 9.533,
"step": 912
},
{
"epoch": 58.0,
"eval_accuracy": 0.8802395209580839,
"eval_loss": 0.3661949932575226,
"eval_runtime": 4.4335,
"eval_samples_per_second": 75.336,
"eval_steps_per_second": 9.473,
"step": 928
},
{
"epoch": 59.0,
"eval_accuracy": 0.8802395209580839,
"eval_loss": 0.36339056491851807,
"eval_runtime": 4.4117,
"eval_samples_per_second": 75.708,
"eval_steps_per_second": 9.52,
"step": 944
},
{
"epoch": 60.0,
"eval_accuracy": 0.8772455089820359,
"eval_loss": 0.36299723386764526,
"eval_runtime": 4.4436,
"eval_samples_per_second": 75.165,
"eval_steps_per_second": 9.452,
"step": 960
},
{
"epoch": 61.0,
"eval_accuracy": 0.8832335329341318,
"eval_loss": 0.3644971549510956,
"eval_runtime": 4.3789,
"eval_samples_per_second": 76.274,
"eval_steps_per_second": 9.591,
"step": 976
},
{
"epoch": 62.0,
"eval_accuracy": 0.8832335329341318,
"eval_loss": 0.3652717173099518,
"eval_runtime": 4.3124,
"eval_samples_per_second": 77.452,
"eval_steps_per_second": 9.739,
"step": 992
},
{
"epoch": 62.5,
"grad_norm": 1.597828984260559,
"learning_rate": 5.984784446322908e-07,
"loss": 0.1919,
"step": 1000
},
{
"epoch": 63.0,
"eval_accuracy": 0.8832335329341318,
"eval_loss": 0.3627488911151886,
"eval_runtime": 4.4759,
"eval_samples_per_second": 74.622,
"eval_steps_per_second": 9.384,
"step": 1008
},
{
"epoch": 64.0,
"eval_accuracy": 0.8772455089820359,
"eval_loss": 0.3642951548099518,
"eval_runtime": 4.4875,
"eval_samples_per_second": 74.428,
"eval_steps_per_second": 9.359,
"step": 1024
},
{
"epoch": 65.0,
"eval_accuracy": 0.874251497005988,
"eval_loss": 0.3665095567703247,
"eval_runtime": 4.39,
"eval_samples_per_second": 76.083,
"eval_steps_per_second": 9.567,
"step": 1040
},
{
"epoch": 66.0,
"eval_accuracy": 0.8772455089820359,
"eval_loss": 0.3633537292480469,
"eval_runtime": 4.4453,
"eval_samples_per_second": 75.135,
"eval_steps_per_second": 9.448,
"step": 1056
},
{
"epoch": 67.0,
"eval_accuracy": 0.8772455089820359,
"eval_loss": 0.36282193660736084,
"eval_runtime": 4.4608,
"eval_samples_per_second": 74.875,
"eval_steps_per_second": 9.415,
"step": 1072
},
{
"epoch": 68.0,
"eval_accuracy": 0.874251497005988,
"eval_loss": 0.36409279704093933,
"eval_runtime": 4.3878,
"eval_samples_per_second": 76.119,
"eval_steps_per_second": 9.572,
"step": 1088
},
{
"epoch": 69.0,
"eval_accuracy": 0.8772455089820359,
"eval_loss": 0.3623464107513428,
"eval_runtime": 4.4706,
"eval_samples_per_second": 74.711,
"eval_steps_per_second": 9.395,
"step": 1104
},
{
"epoch": 70.0,
"eval_accuracy": 0.8772455089820359,
"eval_loss": 0.35881221294403076,
"eval_runtime": 4.3641,
"eval_samples_per_second": 76.533,
"eval_steps_per_second": 9.624,
"step": 1120
}
],
"logging_steps": 500,
"max_steps": 2416,
"num_input_tokens_seen": 0,
"num_train_epochs": 151,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 2.71221963651072e+18,
"train_batch_size": 32,
"trial_name": null,
"trial_params": null
}