Upload folder using huggingface_hub

Files changed (10) hide show

checkpoint-25/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6a42f0dfd4f35726809bedde33d43533382f05320f51b34559ecd66a6ab4a95e
 size 3096165928

 version https://git-lfs.github.com/spec/v1
+oid sha256:1b7f81ce579291f35875ee78d87e54977deb1632985cbffd19debfc87c16f319
 size 3096165928

checkpoint-25/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6a019a20f8d1b33458efcd6e1f31b87ea5952b2ebfe815c5567bf655d0ab6514
 size 6192618087

 version https://git-lfs.github.com/spec/v1
+oid sha256:7094b0c32b0faa650ffcabfbe4735ee60882c6777682a46b78575578f97c45fd
 size 6192618087

checkpoint-25/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:455bb13072703b4695b8fce97607013bd45e6425447d095dda8121451f9cfe1d
 size 1465

 version https://git-lfs.github.com/spec/v1
+oid sha256:e1f60de87fc4b9114f17c73a8e4d7386c49c9ed3c3573c42fb30bcaad96a4b33
 size 1465

checkpoint-25/tokenizer.json CHANGED Viewed

@@ -1,21 +1,7 @@
 {
   "version": "1.0",
-  "truncation": {
-    "direction": "Right",
-    "max_length": 768,
-    "strategy": "LongestFirst",
-    "stride": 0
-  },
-  "padding": {
-    "strategy": {
-      "Fixed": 768
-    },
-    "direction": "Right",
-    "pad_to_multiple_of": null,
-    "pad_id": 50256,
-    "pad_type_id": 0,
-    "pad_token": "<|endoftext|>"
-  },
   "added_tokens": [
     {
       "id": 50256,

 {
   "version": "1.0",
+  "truncation": null,
+  "padding": null,
   "added_tokens": [
     {
       "id": 50256,

checkpoint-25/trainer_state.json CHANGED Viewed

@@ -9,26 +9,19 @@
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
-    {
-      "epoch": 0.4,
-      "grad_norm": 19.882919311523438,
-      "learning_rate": 8e-07,
-      "loss": 8.5763,
-      "step": 10
-    },
     {
       "epoch": 0.8,
-      "grad_norm": 10.610285758972168,
-      "learning_rate": 3e-07,
-      "loss": 8.2046,
       "step": 20
     }
   ],
-  "logging_steps": 10,
   "max_steps": 25,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 1,
-  "save_steps": 50,
   "stateful_callbacks": {
     "TrainerControl": {
       "args": {

   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
       "epoch": 0.8,
+      "grad_norm": 11.499434471130371,
+      "learning_rate": 2.608695652173913e-09,
+      "loss": 8.5489,
       "step": 20
     }
   ],
+  "logging_steps": 20,
   "max_steps": 25,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 1,
+  "save_steps": 100,
   "stateful_callbacks": {
     "TrainerControl": {
       "args": {

checkpoint-25/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4a0e5595bc52473e018b00453670eb5d577d810e5ddec260ef9e96ae80799b79
 size 5841

 version https://git-lfs.github.com/spec/v1
+oid sha256:8764a662c742fe562180326e706ddcaa952662d13772979a9bd2edb6a466fb8d
 size 5841

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6a42f0dfd4f35726809bedde33d43533382f05320f51b34559ecd66a6ab4a95e
 size 3096165928

 version https://git-lfs.github.com/spec/v1
+oid sha256:1b7f81ce579291f35875ee78d87e54977deb1632985cbffd19debfc87c16f319
 size 3096165928

tokenizer.json CHANGED Viewed

@@ -1,21 +1,7 @@
 {
   "version": "1.0",
-  "truncation": {
-    "direction": "Right",
-    "max_length": 768,
-    "strategy": "LongestFirst",
-    "stride": 0
-  },
-  "padding": {
-    "strategy": {
-      "Fixed": 768
-    },
-    "direction": "Right",
-    "pad_to_multiple_of": null,
-    "pad_id": 50256,
-    "pad_type_id": 0,
-    "pad_token": "<|endoftext|>"
-  },
   "added_tokens": [
     {
       "id": 50256,

 {
   "version": "1.0",
+  "truncation": null,
+  "padding": null,
   "added_tokens": [
     {
       "id": 50256,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4a0e5595bc52473e018b00453670eb5d577d810e5ddec260ef9e96ae80799b79
 size 5841

 version https://git-lfs.github.com/spec/v1
+oid sha256:8764a662c742fe562180326e706ddcaa952662d13772979a9bd2edb6a466fb8d
 size 5841

training_log.json CHANGED Viewed

@@ -1,24 +1,17 @@
 [
   {
-    "loss": 8.5763,
-    "grad_norm": 19.882919311523438,
-    "learning_rate": 8e-07,
-    "epoch": 0.4,
-    "step": 10
-  },
-  {
-    "loss": 8.2046,
-    "grad_norm": 10.610285758972168,
-    "learning_rate": 3e-07,
     "epoch": 0.8,
     "step": 20
   },
   {
-    "train_runtime": 619.8465,
-    "train_samples_per_second": 0.161,
-    "train_steps_per_second": 0.04,
     "total_flos": 326426296320000.0,
-    "train_loss": 8.485690612792968,
     "epoch": 1.0,
     "step": 25
   }

 [
   {
+    "loss": 8.5489,
+    "grad_norm": 11.499434471130371,
+    "learning_rate": 2.608695652173913e-09,
     "epoch": 0.8,
     "step": 20
   },
   {
+    "train_runtime": 648.8694,
+    "train_samples_per_second": 0.154,
+    "train_steps_per_second": 0.039,
     "total_flos": 326426296320000.0,
+    "train_loss": 8.712354888916016,
     "epoch": 1.0,
     "step": 25
   }