ccore committed on
Commit
0de2a62
·
verified ·
1 Parent(s): 97dbd71

Training in progress, epoch 7, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4bc8780ec469e6d65fd76e397e5c1a7d5d3b3e5c3cfbe2f53fb093827288fb20
3
  size 500979600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cf8f08f616176452394d58e4224ada71da7d64b801e705eb0b77875c79a4da0
3
  size 500979600
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f1d9b70c27ea33e0731fe9748b5ef52c31397ed8d7209528664c48c6f4c5cd2
3
  size 1002078330
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a168c21d32e0ab0112605e3b30fc1d7b10b74cadd6992eeb837a29e605090ee8
3
  size 1002078330
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c66de8aeca130c769d7a7748933024a1db68486c88d7a55d3b6364277d7e51f2
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5dbb430077813eebb78e89f25ad57a8b8a506e2650404fdf80d07e549f36aeda
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:38c770930cf4a784f6f3c687a772f7b0f7e7c1fc226d92e5bdca2a293d724a84
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b9862d898cb0a9519e8aaf124fb3ce78820e2fee42eb8cbf3caef99627a3651
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.6723850965499878,
3
  "best_model_checkpoint": "./opt_trained3/checkpoint-90",
4
- "epoch": 6.0,
5
  "eval_steps": 500,
6
- "global_step": 90,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -55,6 +55,14 @@
55
  "eval_samples_per_second": 50.427,
56
  "eval_steps_per_second": 12.607,
57
  "step": 90
 
 
 
 
 
 
 
 
58
  }
59
  ],
60
  "logging_steps": 500,
@@ -74,7 +82,7 @@
74
  "attributes": {}
75
  }
76
  },
77
- "total_flos": 3339633680640000.0,
78
  "train_batch_size": 24,
79
  "trial_name": null,
80
  "trial_params": null
 
1
  {
2
  "best_metric": 0.6723850965499878,
3
  "best_model_checkpoint": "./opt_trained3/checkpoint-90",
4
+ "epoch": 7.0,
5
  "eval_steps": 500,
6
+ "global_step": 105,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
55
  "eval_samples_per_second": 50.427,
56
  "eval_steps_per_second": 12.607,
57
  "step": 90
58
+ },
59
+ {
60
+ "epoch": 7.0,
61
+ "eval_loss": 0.6734561920166016,
62
+ "eval_runtime": 5.9536,
63
+ "eval_samples_per_second": 50.39,
64
+ "eval_steps_per_second": 12.598,
65
+ "step": 105
66
  }
67
  ],
68
  "logging_steps": 500,
 
82
  "attributes": {}
83
  }
84
  },
85
+ "total_flos": 3896239294080000.0,
86
  "train_batch_size": 24,
87
  "trial_name": null,
88
  "trial_params": null