mgh6 committed on
Commit
3c1776a
·
verified ·
1 Parent(s): 0b30024

Training in progress, epoch 2, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a4c6f5313c5413e947c3b9ae8fbdcd3db5cfb17ae9d38f3845a0d90a0a99de4
3
  size 2708729576
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c679b10aa2b443874b6a9292e3aae512f5bccabe564b7ded414ea66831aa3f8
3
  size 2708729576
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa9bcb9d383cd758daed3e9bdac436feaaa8ace4983afd451ce084e4618839ef
3
  size 52499200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac2bb89e904aedd054556f139faebaa82a167ab945f6753087d8528f8a3a6120
3
  size 52499200
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b35b4cd4104958a3e34a87e84eee852763c80157fefbeae8abd4d6ed6ea94168
3
  size 15006
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:049c51626ff833ffb21f7771468093aef482329a954eee51e7f93ee61f521bdf
3
  size 15006
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bca4dbe650e04bc8012dd3f1938dfb2a637329721abd75c3bd59d28a64007b54
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e8b7bfccb9c07860bceffabef3a52060cc451a19d3abd90d284c09f7120dba6
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.0,
5
  "eval_steps": 50,
6
- "global_step": 129,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -35,6 +35,48 @@
35
  "eval_samples_per_second": 21.847,
36
  "eval_steps_per_second": 5.462,
37
  "step": 100
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
38
  }
39
  ],
40
  "logging_steps": 50,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.0,
5
  "eval_steps": 50,
6
+ "global_step": 258,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
35
  "eval_samples_per_second": 21.847,
36
  "eval_steps_per_second": 5.462,
37
  "step": 100
38
+ },
39
+ {
40
+ "epoch": 1.16398243045388,
41
+ "grad_norm": 502497.4375,
42
+ "learning_rate": 8.828125000000001e-05,
43
+ "loss": 3495.4003,
44
+ "step": 150
45
+ },
46
+ {
47
+ "epoch": 1.16398243045388,
48
+ "eval_runtime": 19.7678,
49
+ "eval_samples_per_second": 21.854,
50
+ "eval_steps_per_second": 5.463,
51
+ "step": 150
52
+ },
53
+ {
54
+ "epoch": 1.5544167886774036,
55
+ "grad_norm": 733164.8125,
56
+ "learning_rate": 8.4375e-05,
57
+ "loss": 3503.1944,
58
+ "step": 200
59
+ },
60
+ {
61
+ "epoch": 1.5544167886774036,
62
+ "eval_runtime": 19.8051,
63
+ "eval_samples_per_second": 21.813,
64
+ "eval_steps_per_second": 5.453,
65
+ "step": 200
66
+ },
67
+ {
68
+ "epoch": 1.9448511469009273,
69
+ "grad_norm": 385944.6875,
70
+ "learning_rate": 8.046875e-05,
71
+ "loss": 2722.6881,
72
+ "step": 250
73
+ },
74
+ {
75
+ "epoch": 1.9448511469009273,
76
+ "eval_runtime": 19.7807,
77
+ "eval_samples_per_second": 21.839,
78
+ "eval_steps_per_second": 5.46,
79
+ "step": 250
80
  }
81
  ],
82
  "logging_steps": 50,