mgh6 committed on
Commit
9ccb022
·
verified ·
1 Parent(s): 9de8b8e

Training in progress, epoch 4, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:05ac4f10040e66e431df938b7856d13f664df0b46d6101710def3a334fcb9ba6
3
  size 2610104820
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b49e9d5c8dd881f520e5a83128f40de519e68051af511937686445660ec5001b
3
  size 2610104820
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:75140785cd75a1282efaf5e3f8124ffe807377629f03660cc850719c0ef15a2b
3
  size 5210004271
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef26bd0d9cddd87b41bd441bf83979bef25265f8afb106bf9f07ea1c78276a60
3
  size 5210004271
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d01c0856a6fb316f12ae7b5a00934bd3a02b2c39928e0f3f92795aaa541bbc2
3
  size 15006
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7cf274d687459d8fbef424ee490939d2e6b5b3ea4569321a0d69cd2a401ebb4
3
  size 15006
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9885f6cee74ee5ecf8b98902b21218a1e0a6e8b4b6018e56d76ad82d9af7fb58
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:847be9d40b77e3bc7d7f6246e96a0e0054d918fd2ef8f822e1dd9b59a4a52a77
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 1.3419935703277588,
3
- "best_model_checkpoint": "mgh6/HTH_prob/checkpoint-976",
4
- "epoch": 3.9960454139558617,
5
  "eval_steps": 500,
6
- "global_step": 976,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -67,6 +67,21 @@
67
  "eval_samples_per_second": 32.751,
68
  "eval_steps_per_second": 16.376,
69
  "step": 976
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
70
  }
71
  ],
72
  "logging_steps": 500,
 
1
  {
2
+ "best_metric": 1.3339548110961914,
3
+ "best_model_checkpoint": "mgh6/HTH_prob/checkpoint-1220",
4
+ "epoch": 4.996045413955862,
5
  "eval_steps": 500,
6
+ "global_step": 1220,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
67
  "eval_samples_per_second": 32.751,
68
  "eval_steps_per_second": 16.376,
69
  "step": 976
70
+ },
71
+ {
72
+ "epoch": 4.996045413955862,
73
+ "grad_norm": 0.16875308752059937,
74
+ "learning_rate": 0.0009166666666666666,
75
+ "loss": 1.3448,
76
+ "step": 1220
77
+ },
78
+ {
79
+ "epoch": 4.996045413955862,
80
+ "eval_loss": 1.3339548110961914,
81
+ "eval_runtime": 25.1789,
82
+ "eval_samples_per_second": 32.805,
83
+ "eval_steps_per_second": 16.403,
84
+ "step": 1220
85
  }
86
  ],
87
  "logging_steps": 500,