ccore committed on
Commit
9f8bd15
·
verified ·
1 Parent(s): 66ab34f

Training in progress, epoch 7, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:acc7efc5ac731fed0225a95e6a6619debcf2385b4b55b86cd89af40df519b46e
3
  size 500979600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:576846bd48b72cd7aaf1830841153e585d029c6c4825445154a8e90cdd1d588d
3
  size 500979600
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8642788ff9b15322c67b31af5c83e47538f0e8734eb5c8110ac94b13c19fc8eb
3
  size 1002078330
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c72e158baa306f60707acab85d117f5dd90e0927a25c1e424ec553e2e2f4d5e
3
  size 1002078330
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c66de8aeca130c769d7a7748933024a1db68486c88d7a55d3b6364277d7e51f2
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5dbb430077813eebb78e89f25ad57a8b8a506e2650404fdf80d07e549f36aeda
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:38c770930cf4a784f6f3c687a772f7b0f7e7c1fc226d92e5bdca2a293d724a84
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b9862d898cb0a9519e8aaf124fb3ce78820e2fee42eb8cbf3caef99627a3651
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.6301519274711609,
3
  "best_model_checkpoint": "./opt_trained3/checkpoint-60",
4
- "epoch": 6.0,
5
  "eval_steps": 500,
6
- "global_step": 90,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -55,6 +55,14 @@
55
  "eval_samples_per_second": 50.134,
56
  "eval_steps_per_second": 12.534,
57
  "step": 90
 
 
 
 
 
 
 
 
58
  }
59
  ],
60
  "logging_steps": 500,
@@ -74,7 +82,7 @@
74
  "attributes": {}
75
  }
76
  },
77
- "total_flos": 3339633680640000.0,
78
  "train_batch_size": 24,
79
  "trial_name": null,
80
  "trial_params": null
 
1
  {
2
  "best_metric": 0.6301519274711609,
3
  "best_model_checkpoint": "./opt_trained3/checkpoint-60",
4
+ "epoch": 7.0,
5
  "eval_steps": 500,
6
+ "global_step": 105,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
55
  "eval_samples_per_second": 50.134,
56
  "eval_steps_per_second": 12.534,
57
  "step": 90
58
+ },
59
+ {
60
+ "epoch": 7.0,
61
+ "eval_loss": 0.6327991485595703,
62
+ "eval_runtime": 5.9926,
63
+ "eval_samples_per_second": 50.062,
64
+ "eval_steps_per_second": 12.516,
65
+ "step": 105
66
  }
67
  ],
68
  "logging_steps": 500,
 
82
  "attributes": {}
83
  }
84
  },
85
+ "total_flos": 3896239294080000.0,
86
  "train_batch_size": 24,
87
  "trial_name": null,
88
  "trial_params": null