Training in progress, step 150, checkpoint

Browse files

Files changed (7) hide show

last-checkpoint/adapter_config.json +2 -2
last-checkpoint/adapter_model.safetensors +1 -1
last-checkpoint/optimizer.pt +2 -2
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +2 -2
last-checkpoint/trainer_state.json +72 -524
last-checkpoint/training_args.bin +2 -2

last-checkpoint/adapter_config.json CHANGED Viewed

@@ -22,8 +22,8 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "q_proj",
-    "k_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "k_proj",
+    "q_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e509195daf848fcb63ff142e78b630faccf6e51fad01b6e3b473f7c9b81e1da0
 size 527048968

 version https://git-lfs.github.com/spec/v1
+oid sha256:1de9c7983d81c83a25d9f5af8ab2f633d7e6d24eec5b255ecd10994cf1de3e68
 size 527048968

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:44ecbc32e205dad7c9ef52f7e61a7eb02340bf5159e891c7a802a3da51f2db68
-size 1054136250

 version https://git-lfs.github.com/spec/v1
+oid sha256:d9b36b33638ac27ad81d5b5cd5fa2e56673b3a7acb5c226ff0baa60d122dfdc7
+size 1054135994

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d591cd4a87db6ff7862986fcbd71a7ea08ac34a6c4ca00eb88fbc6e4ccf1c5bd
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:afdcd158786234085082ce38b1824c51dd8c72881220443fc2d1c6f4e031a983
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f47df519d3e34f85833ffe9513be298918979811657719c019fec7ab68351e14
-size 1256

 version https://git-lfs.github.com/spec/v1
+oid sha256:11a68d93d91bb3affb76e357047e1fc6d0e0e337baf5ccbf0315ac19ab68b7ca
+size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,583 +1,131 @@
 {
-  "best_metric": 0.7210280299186707,
-  "best_model_checkpoint": "./output/checkpoint-750",
-  "epoch": 16.666666666666668,
   "eval_steps": 150,
-  "global_step": 750,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 0.2222222222222222,
-      "grad_norm": 1.9091473817825317,
-      "learning_rate": 2.9999999999999984e-06,
-      "loss": 0.6619,
       "step": 10
     },
     {
-      "epoch": 0.4444444444444444,
-      "grad_norm": 1.8889063596725464,
-      "learning_rate": 5.999999999999997e-06,
-      "loss": 0.7254,
       "step": 20
     },
     {
-      "epoch": 0.6666666666666666,
-      "grad_norm": 1.6717636585235596,
-      "learning_rate": 8.999999999999993e-06,
-      "loss": 0.7335,
       "step": 30
     },
     {
-      "epoch": 0.8888888888888888,
-      "grad_norm": 1.5766067504882812,
-      "learning_rate": 1.1999999999999994e-05,
-      "loss": 0.7377,
       "step": 40
     },
     {
-      "epoch": 1.1111111111111112,
-      "grad_norm": 1.2490640878677368,
-      "learning_rate": 1.499999999999999e-05,
-      "loss": 0.8942,
       "step": 50
     },
     {
-      "epoch": 1.3333333333333333,
-      "grad_norm": 1.1447882652282715,
-      "learning_rate": 1.7999999999999987e-05,
-      "loss": 0.7146,
       "step": 60
     },
     {
-      "epoch": 1.5555555555555556,
-      "grad_norm": 1.5109171867370605,
-      "learning_rate": 2.0999999999999985e-05,
-      "loss": 0.7579,
       "step": 70
     },
     {
-      "epoch": 1.7777777777777777,
-      "grad_norm": 1.8730992078781128,
-      "learning_rate": 2.3999999999999987e-05,
-      "loss": 0.707,
       "step": 80
     },
     {
-      "epoch": 2.0,
-      "grad_norm": 2.063655138015747,
-      "learning_rate": 2.6999999999999982e-05,
-      "loss": 0.7705,
       "step": 90
     },
     {
-      "epoch": 2.2222222222222223,
-      "grad_norm": 1.565353512763977,
-      "learning_rate": 2.999999999999998e-05,
-      "loss": 0.7273,
       "step": 100
     },
     {
-      "epoch": 2.4444444444444446,
-      "grad_norm": 1.701326608657837,
-      "learning_rate": 2.999999702723961e-05,
-      "loss": 0.7474,
       "step": 110
     },
     {
-      "epoch": 2.6666666666666665,
-      "grad_norm": 2.7937393188476562,
-      "learning_rate": 2.9999988108959667e-05,
-      "loss": 0.5701,
       "step": 120
     },
     {
-      "epoch": 2.888888888888889,
-      "grad_norm": 2.1285998821258545,
-      "learning_rate": 2.9999973245163695e-05,
-      "loss": 0.7044,
       "step": 130
     },
     {
-      "epoch": 3.111111111111111,
-      "grad_norm": 2.2441246509552,
-      "learning_rate": 2.999995243585758e-05,
-      "loss": 0.717,
       "step": 140
     },
     {
-      "epoch": 3.3333333333333335,
-      "grad_norm": 1.9379878044128418,
-      "learning_rate": 2.9999925681049573e-05,
-      "loss": 0.664,
       "step": 150
     },
     {
-      "epoch": 3.3333333333333335,
-      "eval_loss": 0.7682406902313232,
-      "eval_runtime": 0.4514,
-      "eval_samples_per_second": 22.155,
-      "eval_steps_per_second": 22.155,
       "step": 150
-    },
-    {
-      "epoch": 3.5555555555555554,
-      "grad_norm": 2.575423002243042,
-      "learning_rate": 2.9999892980750276e-05,
-      "loss": 0.6943,
-      "step": 160
-    },
-    {
-      "epoch": 3.7777777777777777,
-      "grad_norm": 2.392334222793579,
-      "learning_rate": 2.9999854334972655e-05,
-      "loss": 0.6922,
-      "step": 170
-    },
-    {
-      "epoch": 4.0,
-      "grad_norm": 2.5393826961517334,
-      "learning_rate": 2.999980974373202e-05,
-      "loss": 0.6677,
-      "step": 180
-    },
-    {
-      "epoch": 4.222222222222222,
-      "grad_norm": 1.6046398878097534,
-      "learning_rate": 2.9999759207046055e-05,
-      "loss": 0.5898,
-      "step": 190
-    },
-    {
-      "epoch": 4.444444444444445,
-      "grad_norm": 1.681414246559143,
-      "learning_rate": 2.9999702724934783e-05,
-      "loss": 0.7117,
-      "step": 200
-    },
-    {
-      "epoch": 4.666666666666667,
-      "grad_norm": 3.416290044784546,
-      "learning_rate": 2.99996402974206e-05,
-      "loss": 0.6278,
-      "step": 210
-    },
-    {
-      "epoch": 4.888888888888889,
-      "grad_norm": 2.0781354904174805,
-      "learning_rate": 2.9999571924528243e-05,
-      "loss": 0.6732,
-      "step": 220
-    },
-    {
-      "epoch": 5.111111111111111,
-      "grad_norm": 2.630134105682373,
-      "learning_rate": 2.9999497606284816e-05,
-      "loss": 0.6029,
-      "step": 230
-    },
-    {
-      "epoch": 5.333333333333333,
-      "grad_norm": 1.482037901878357,
-      "learning_rate": 2.9999417342719775e-05,
-      "loss": 0.6941,
-      "step": 240
-    },
-    {
-      "epoch": 5.555555555555555,
-      "grad_norm": 2.217900514602661,
-      "learning_rate": 2.9999331133864935e-05,
-      "loss": 0.6478,
-      "step": 250
-    },
-    {
-      "epoch": 5.777777777777778,
-      "grad_norm": 1.7131129503250122,
-      "learning_rate": 2.9999238979754465e-05,
-      "loss": 0.6095,
-      "step": 260
-    },
-    {
-      "epoch": 6.0,
-      "grad_norm": 1.908470869064331,
-      "learning_rate": 2.99991408804249e-05,
-      "loss": 0.5758,
-      "step": 270
-    },
-    {
-      "epoch": 6.222222222222222,
-      "grad_norm": 2.141641616821289,
-      "learning_rate": 2.999903683591511e-05,
-      "loss": 0.574,
-      "step": 280
-    },
-    {
-      "epoch": 6.444444444444445,
-      "grad_norm": 1.3931849002838135,
-      "learning_rate": 2.9998926846266345e-05,
-      "loss": 0.6139,
-      "step": 290
-    },
-    {
-      "epoch": 6.666666666666667,
-      "grad_norm": 2.278519868850708,
-      "learning_rate": 2.9998810911522193e-05,
-      "loss": 0.6227,
-      "step": 300
-    },
-    {
-      "epoch": 6.666666666666667,
-      "eval_loss": 0.7388573884963989,
-      "eval_runtime": 0.4661,
-      "eval_samples_per_second": 21.453,
-      "eval_steps_per_second": 21.453,
-      "step": 300
-    },
-    {
-      "epoch": 6.888888888888889,
-      "grad_norm": 2.712602138519287,
-      "learning_rate": 2.9998689031728615e-05,
-      "loss": 0.6479,
-      "step": 310
-    },
-    {
-      "epoch": 7.111111111111111,
-      "grad_norm": 1.7634906768798828,
-      "learning_rate": 2.9998561206933918e-05,
-      "loss": 0.5863,
-      "step": 320
-    },
-    {
-      "epoch": 7.333333333333333,
-      "grad_norm": 1.772024154663086,
-      "learning_rate": 2.9998427437188766e-05,
-      "loss": 0.5795,
-      "step": 330
-    },
-    {
-      "epoch": 7.555555555555555,
-      "grad_norm": 2.34784197807312,
-      "learning_rate": 2.999828772254618e-05,
-      "loss": 0.6034,
-      "step": 340
-    },
-    {
-      "epoch": 7.777777777777778,
-      "grad_norm": 2.455519199371338,
-      "learning_rate": 2.9998142063061544e-05,
-      "loss": 0.6625,
-      "step": 350
-    },
-    {
-      "epoch": 8.0,
-      "grad_norm": 1.3227782249450684,
-      "learning_rate": 2.9997990458792583e-05,
-      "loss": 0.6041,
-      "step": 360
-    },
-    {
-      "epoch": 8.222222222222221,
-      "grad_norm": 1.9034490585327148,
-      "learning_rate": 2.9997832909799397e-05,
-      "loss": 0.5491,
-      "step": 370
-    },
-    {
-      "epoch": 8.444444444444445,
-      "grad_norm": 1.9352225065231323,
-      "learning_rate": 2.9997669416144432e-05,
-      "loss": 0.6406,
-      "step": 380
-    },
-    {
-      "epoch": 8.666666666666666,
-      "grad_norm": 1.0488076210021973,
-      "learning_rate": 2.999749997789249e-05,
-      "loss": 0.5398,
-      "step": 390
-    },
-    {
-      "epoch": 8.88888888888889,
-      "grad_norm": 1.5216209888458252,
-      "learning_rate": 2.9997324595110723e-05,
-      "loss": 0.6545,
-      "step": 400
-    },
-    {
-      "epoch": 9.11111111111111,
-      "grad_norm": 1.3843863010406494,
-      "learning_rate": 2.9997143267868663e-05,
-      "loss": 0.5948,
-      "step": 410
-    },
-    {
-      "epoch": 9.333333333333334,
-      "grad_norm": 2.4701507091522217,
-      "learning_rate": 2.999695599623817e-05,
-      "loss": 0.6224,
-      "step": 420
-    },
-    {
-      "epoch": 9.555555555555555,
-      "grad_norm": 2.598496198654175,
-      "learning_rate": 2.9996762780293483e-05,
-      "loss": 0.575,
-      "step": 430
-    },
-    {
-      "epoch": 9.777777777777779,
-      "grad_norm": 1.5249278545379639,
-      "learning_rate": 2.9996563620111176e-05,
-      "loss": 0.5294,
-      "step": 440
-    },
-    {
-      "epoch": 10.0,
-      "grad_norm": 1.3830034732818604,
-      "learning_rate": 2.9996358515770198e-05,
-      "loss": 0.5417,
-      "step": 450
-    },
-    {
-      "epoch": 10.0,
-      "eval_loss": 0.726381778717041,
-      "eval_runtime": 0.4056,
-      "eval_samples_per_second": 24.653,
-      "eval_steps_per_second": 24.653,
-      "step": 450
-    },
-    {
-      "epoch": 10.222222222222221,
-      "grad_norm": 2.226635456085205,
-      "learning_rate": 2.9996147467351836e-05,
-      "loss": 0.506,
-      "step": 460
-    },
-    {
-      "epoch": 10.444444444444445,
-      "grad_norm": 1.4145069122314453,
-      "learning_rate": 2.9995930474939753e-05,
-      "loss": 0.4908,
-      "step": 470
-    },
-    {
-      "epoch": 10.666666666666666,
-      "grad_norm": 1.9364039897918701,
-      "learning_rate": 2.9995707538619954e-05,
-      "loss": 0.6364,
-      "step": 480
-    },
-    {
-      "epoch": 10.88888888888889,
-      "grad_norm": 2.14816951751709,
-      "learning_rate": 2.9995478658480802e-05,
-      "loss": 0.5532,
-      "step": 490
-    },
-    {
-      "epoch": 11.11111111111111,
-      "grad_norm": 1.8744515180587769,
-      "learning_rate": 2.9995243834613023e-05,
-      "loss": 0.5234,
-      "step": 500
-    },
-    {
-      "epoch": 11.333333333333334,
-      "grad_norm": 1.6773265600204468,
-      "learning_rate": 2.9995003067109687e-05,
-      "loss": 0.5392,
-      "step": 510
-    },
-    {
-      "epoch": 11.555555555555555,
-      "grad_norm": 2.6416842937469482,
-      "learning_rate": 2.9994756356066226e-05,
-      "loss": 0.5848,
-      "step": 520
-    },
-    {
-      "epoch": 11.777777777777779,
-      "grad_norm": 2.257610321044922,
-      "learning_rate": 2.999450370158044e-05,
-      "loss": 0.5336,
-      "step": 530
-    },
-    {
-      "epoch": 12.0,
-      "grad_norm": 1.5329607725143433,
-      "learning_rate": 2.9994245103752457e-05,
-      "loss": 0.5242,
-      "step": 540
-    },
-    {
-      "epoch": 12.222222222222221,
-      "grad_norm": 1.2473564147949219,
-      "learning_rate": 2.999398056268479e-05,
-      "loss": 0.5356,
-      "step": 550
-    },
-    {
-      "epoch": 12.444444444444445,
-      "grad_norm": 1.4698841571807861,
-      "learning_rate": 2.9993710078482286e-05,
-      "loss": 0.4155,
-      "step": 560
-    },
-    {
-      "epoch": 12.666666666666666,
-      "grad_norm": 3.38484525680542,
-      "learning_rate": 2.9993433651252164e-05,
-      "loss": 0.6201,
-      "step": 570
-    },
-    {
-      "epoch": 12.88888888888889,
-      "grad_norm": 1.4733773469924927,
-      "learning_rate": 2.9993151281103986e-05,
-      "loss": 0.5349,
-      "step": 580
-    },
-    {
-      "epoch": 13.11111111111111,
-      "grad_norm": 2.4409337043762207,
-      "learning_rate": 2.9992862968149675e-05,
-      "loss": 0.4179,
-      "step": 590
-    },
-    {
-      "epoch": 13.333333333333334,
-      "grad_norm": 2.4499781131744385,
-      "learning_rate": 2.9992568712503513e-05,
-      "loss": 0.5321,
-      "step": 600
-    },
-    {
-      "epoch": 13.333333333333334,
-      "eval_loss": 0.7211434841156006,
-      "eval_runtime": 0.4323,
-      "eval_samples_per_second": 23.134,
-      "eval_steps_per_second": 23.134,
-      "step": 600
-    },
-    {
-      "epoch": 13.555555555555555,
-      "grad_norm": 2.347456455230713,
-      "learning_rate": 2.9992268514282122e-05,
-      "loss": 0.5653,
-      "step": 610
-    },
-    {
-      "epoch": 13.777777777777779,
-      "grad_norm": 2.2229528427124023,
-      "learning_rate": 2.99919623736045e-05,
-      "loss": 0.4408,
-      "step": 620
-    },
-    {
-      "epoch": 14.0,
-      "grad_norm": 2.275893449783325,
-      "learning_rate": 2.9991650290591996e-05,
-      "loss": 0.6037,
-      "step": 630
-    },
-    {
-      "epoch": 14.222222222222221,
-      "grad_norm": 2.250699520111084,
-      "learning_rate": 2.99913322653683e-05,
-      "loss": 0.4922,
-      "step": 640
-    },
-    {
-      "epoch": 14.444444444444445,
-      "grad_norm": 1.8398470878601074,
-      "learning_rate": 2.9991008298059473e-05,
-      "loss": 0.5012,
-      "step": 650
-    },
-    {
-      "epoch": 14.666666666666666,
-      "grad_norm": 1.539143443107605,
-      "learning_rate": 2.9990678388793924e-05,
-      "loss": 0.5321,
-      "step": 660
-    },
-    {
-      "epoch": 14.88888888888889,
-      "grad_norm": 1.2890745401382446,
-      "learning_rate": 2.999034253770242e-05,
-      "loss": 0.4581,
-      "step": 670
-    },
-    {
-      "epoch": 15.11111111111111,
-      "grad_norm": 2.539614200592041,
-      "learning_rate": 2.9990000744918076e-05,
-      "loss": 0.4486,
-      "step": 680
-    },
-    {
-      "epoch": 15.333333333333334,
-      "grad_norm": 1.6030837297439575,
-      "learning_rate": 2.9989653010576372e-05,
-      "loss": 0.4528,
-      "step": 690
-    },
-    {
-      "epoch": 15.555555555555555,
-      "grad_norm": 1.46444571018219,
-      "learning_rate": 2.9989299334815138e-05,
-      "loss": 0.4805,
-      "step": 700
-    },
-    {
-      "epoch": 15.777777777777779,
-      "grad_norm": 2.233593702316284,
-      "learning_rate": 2.9988939717774558e-05,
-      "loss": 0.5241,
-      "step": 710
-    },
-    {
-      "epoch": 16.0,
-      "grad_norm": 1.3459173440933228,
-      "learning_rate": 2.9988574159597174e-05,
-      "loss": 0.5107,
-      "step": 720
-    },
-    {
-      "epoch": 16.22222222222222,
-      "grad_norm": 2.139714241027832,
-      "learning_rate": 2.9988202660427887e-05,
-      "loss": 0.4647,
-      "step": 730
-    },
-    {
-      "epoch": 16.444444444444443,
-      "grad_norm": 3.066899061203003,
-      "learning_rate": 2.9987825220413937e-05,
-      "loss": 0.5351,
-      "step": 740
-    },
-    {
-      "epoch": 16.666666666666668,
-      "grad_norm": 1.896189570426941,
-      "learning_rate": 2.998744183970494e-05,
-      "loss": 0.4269,
-      "step": 750
-    },
-    {
-      "epoch": 16.666666666666668,
-      "eval_loss": 0.7210280299186707,
-      "eval_runtime": 0.4276,
-      "eval_samples_per_second": 23.389,
-      "eval_steps_per_second": 23.389,
-      "step": 750
     }
   ],
   "logging_steps": 10,
   "max_steps": 50000,
   "num_input_tokens_seen": 0,
-  "num_train_epochs": 1112,
   "save_steps": 150,
   "stateful_callbacks": {
     "TrainerControl": {
@@ -591,8 +139,8 @@
       "attributes": {}
     }
   },
-  "total_flos": 7981049240027136.0,
-  "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null
 }

 {
+  "best_metric": 0.7480350136756897,
+  "best_model_checkpoint": "./output/checkpoint-150",
+  "epoch": 6.521739130434782,
   "eval_steps": 150,
+  "global_step": 150,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 0.43478260869565216,
+      "grad_norm": 1.5022108554840088,
+      "learning_rate": 5e-06,
+      "loss": 0.9063,
       "step": 10
     },
     {
+      "epoch": 0.8695652173913043,
+      "grad_norm": 1.679484248161316,
+      "learning_rate": 1e-05,
+      "loss": 0.9018,
       "step": 20
     },
     {
+      "epoch": 1.3043478260869565,
+      "grad_norm": 1.7071681022644043,
+      "learning_rate": 1.5e-05,
+      "loss": 0.8972,
       "step": 30
     },
     {
+      "epoch": 1.7391304347826086,
+      "grad_norm": 1.4155817031860352,
+      "learning_rate": 2e-05,
+      "loss": 0.9019,
       "step": 40
     },
     {
+      "epoch": 2.1739130434782608,
+      "grad_norm": 1.2699992656707764,
+      "learning_rate": 2.5e-05,
+      "loss": 0.8208,
       "step": 50
     },
     {
+      "epoch": 2.608695652173913,
+      "grad_norm": 1.902714729309082,
+      "learning_rate": 3e-05,
+      "loss": 0.865,
       "step": 60
     },
     {
+      "epoch": 3.0434782608695654,
+      "grad_norm": 1.344117283821106,
+      "learning_rate": 3.5e-05,
+      "loss": 0.853,
       "step": 70
     },
     {
+      "epoch": 3.4782608695652173,
+      "grad_norm": 1.6205377578735352,
+      "learning_rate": 4e-05,
+      "loss": 0.774,
       "step": 80
     },
     {
+      "epoch": 3.9130434782608696,
+      "grad_norm": 1.364487886428833,
+      "learning_rate": 4.5e-05,
+      "loss": 0.8004,
       "step": 90
     },
     {
+      "epoch": 4.3478260869565215,
+      "grad_norm": 1.2991905212402344,
+      "learning_rate": 5e-05,
+      "loss": 0.7915,
       "step": 100
     },
     {
+      "epoch": 4.782608695652174,
+      "grad_norm": 2.0769360065460205,
+      "learning_rate": 4.999999504539938e-05,
+      "loss": 0.7423,
       "step": 110
     },
     {
+      "epoch": 5.217391304347826,
+      "grad_norm": 1.0391877889633179,
+      "learning_rate": 4.999998018159948e-05,
+      "loss": 0.6799,
       "step": 120
     },
     {
+      "epoch": 5.6521739130434785,
+      "grad_norm": 1.4947184324264526,
+      "learning_rate": 4.999995540860619e-05,
+      "loss": 0.6506,
       "step": 130
     },
     {
+      "epoch": 6.086956521739131,
+      "grad_norm": 1.8294117450714111,
+      "learning_rate": 4.999992072642933e-05,
+      "loss": 0.6741,
       "step": 140
     },
     {
+      "epoch": 6.521739130434782,
+      "grad_norm": 1.1097073554992676,
+      "learning_rate": 4.9999876135082656e-05,
+      "loss": 0.6923,
       "step": 150
     },
     {
+      "epoch": 6.521739130434782,
+      "eval_loss": 0.7480350136756897,
+      "eval_runtime": 0.5268,
+      "eval_samples_per_second": 18.983,
+      "eval_steps_per_second": 18.983,
       "step": 150
     }
   ],
   "logging_steps": 10,
   "max_steps": 50000,
   "num_input_tokens_seen": 0,
+  "num_train_epochs": 2174,
   "save_steps": 150,
   "stateful_callbacks": {
     "TrainerControl": {
       "attributes": {}
     }
   },
+  "total_flos": 3894839614291968.0,
+  "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null
 }

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:68671d3a40b312e8c641605c2dc5233644a3f074e034d0d6789a3fdd173db03a
-size 5496

 version https://git-lfs.github.com/spec/v1
+oid sha256:c534cfc3e2dd38ea6fb24a33807c3d741b1e0c48890f1270e8024ad58bfd114d
+size 5368