Yuvrajg2107 committed on
Commit
cce6eaa
·
verified ·
1 Parent(s): cbc5915

Training in progress, step 4000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6d7421efb0f77cd2ad05e257eaaa7cf70bc46b98f46b55a33fcb605105540605
3
  size 1340623936
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbbc7c632d4d6f6dc374492bd1211cba1a35d6ffeddbfb05e32ba3a1a59c6c92
3
  size 1340623936
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:97cd9487290e93a4cf8df97c810828fa6608cfd8679b75d5176a1b829226af00
3
  size 2681480830
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f074e1f4dcfde9a10a17643892cc0dffb9ce7d3df88081d2f01e5283c4103d1d
3
  size 2681480830
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e484b91022d49823d8d81e38c9d2aecc8d11dd67a5a779bad4167814a1359c3d
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:713fbe99f9819d314ca7c04ce5f81ee51364f89ca336ef4d1337ed0aadfb47e5
3
  size 14645
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5ac1c46a2776d12775d23d0f587efc112188137ce2140da35bc15d301c9f620e
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0033c7745b46bdca3ecab5787678834ca68f7f7e1288869dceeb38812abc253
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d3f655ea9c5a4a9f86c577483cce348f86f4499f93b7851c6926bdee4b92c1f
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44bf4923ec42942364989fd2f30726b763bdfd466c393a6e0a85d3fa348231ab
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 2000,
3
  "best_metric": 0.07912886142730713,
4
  "best_model_checkpoint": "./training_output/checkpoint-2000",
5
- "epoch": 0.375,
6
  "eval_steps": 1000,
7
- "global_step": 3000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -77,6 +77,29 @@
77
  "eval_samples_per_second": 15.203,
78
  "eval_steps_per_second": 0.95,
79
  "step": 3000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
80
  }
81
  ],
82
  "logging_steps": 500,
@@ -96,7 +119,7 @@
96
  "attributes": {}
97
  }
98
  },
99
- "total_flos": 1.1183176359936e+16,
100
  "train_batch_size": 2,
101
  "trial_name": null,
102
  "trial_params": null
 
2
  "best_global_step": 2000,
3
  "best_metric": 0.07912886142730713,
4
  "best_model_checkpoint": "./training_output/checkpoint-2000",
5
+ "epoch": 0.5,
6
  "eval_steps": 1000,
7
+ "global_step": 4000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
77
  "eval_samples_per_second": 15.203,
78
  "eval_steps_per_second": 0.95,
79
  "step": 3000
80
+ },
81
+ {
82
+ "epoch": 0.4375,
83
+ "grad_norm": 10.261446952819824,
84
+ "learning_rate": 1.1252500000000001e-05,
85
+ "loss": 0.0581,
86
+ "step": 3500
87
+ },
88
+ {
89
+ "epoch": 0.5,
90
+ "grad_norm": 6.691280364990234,
91
+ "learning_rate": 1.0002500000000001e-05,
92
+ "loss": 0.1161,
93
+ "step": 4000
94
+ },
95
+ {
96
+ "epoch": 0.5,
97
+ "eval_accuracy": 0.350625,
98
+ "eval_loss": 0.22534234821796417,
99
+ "eval_runtime": 518.3611,
100
+ "eval_samples_per_second": 15.433,
101
+ "eval_steps_per_second": 0.965,
102
+ "step": 4000
103
  }
104
  ],
105
  "logging_steps": 500,
 
119
  "attributes": {}
120
  }
121
  },
122
+ "total_flos": 1.4910901813248e+16,
123
  "train_batch_size": 2,
124
  "trial_name": null,
125
  "trial_params": null