ales commited on
Commit
69c7d3e
·
1 Parent(s): c54ad8c

End of training

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 1.05,
3
- "eval_loss": 0.974454939365387,
4
- "eval_runtime": 20.3472,
5
  "eval_samples": 64,
6
- "eval_samples_per_second": 3.145,
7
- "eval_steps_per_second": 0.098,
8
- "eval_wer": 75.27472527472527,
9
- "train_loss": 0.041942973931630455,
10
- "train_runtime": 33.8193,
11
- "train_samples_per_second": 18.924,
12
- "train_steps_per_second": 0.591
13
  }
 
1
  {
2
+ "epoch": 1.0,
3
+ "eval_loss": 0.6197173595428467,
4
+ "eval_runtime": 18.6322,
5
  "eval_samples": 64,
6
+ "eval_samples_per_second": 3.435,
7
+ "eval_steps_per_second": 0.107,
8
+ "eval_wer": 60.43956043956044,
9
+ "train_loss": 0.6153274965286255,
10
+ "train_runtime": 782.3972,
11
+ "train_samples_per_second": 4.09,
12
+ "train_steps_per_second": 0.128
13
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 1.05,
3
- "eval_loss": 0.974454939365387,
4
- "eval_runtime": 20.3472,
5
  "eval_samples": 64,
6
- "eval_samples_per_second": 3.145,
7
- "eval_steps_per_second": 0.098,
8
- "eval_wer": 75.27472527472527
9
  }
 
1
  {
2
+ "epoch": 1.0,
3
+ "eval_loss": 0.6197173595428467,
4
+ "eval_runtime": 18.6322,
5
  "eval_samples": 64,
6
+ "eval_samples_per_second": 3.435,
7
+ "eval_steps_per_second": 0.107,
8
+ "eval_wer": 60.43956043956044
9
  }
runs/Dec12_19-28-45_13ea4557542f/events.out.tfevents.1670874502.13ea4557542f.8478.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bc918c0875efeac070effa512c0f38bc47ccada1467ef3d4c037fd4f656d329
3
+ size 352
train.log CHANGED
@@ -33,3 +33,9 @@
33
  {'loss': 0.6678, 'learning_rate': 3.1578947368421056e-06, 'epoch': 1.0}
34
  {'eval_loss': 0.5758526921272278, 'eval_wer': 61.53846153846154, 'eval_runtime': 19.5593, 'eval_samples_per_second': 3.272, 'eval_steps_per_second': 0.102, 'epoch': 1.0}
35
  {'train_runtime': 782.3972, 'train_samples_per_second': 4.09, 'train_steps_per_second': 0.128, 'train_loss': 0.6153274965286255, 'epoch': 1.0}
 
 
 
 
 
 
 
33
  {'loss': 0.6678, 'learning_rate': 3.1578947368421056e-06, 'epoch': 1.0}
34
  {'eval_loss': 0.5758526921272278, 'eval_wer': 61.53846153846154, 'eval_runtime': 19.5593, 'eval_samples_per_second': 3.272, 'eval_steps_per_second': 0.102, 'epoch': 1.0}
35
  {'train_runtime': 782.3972, 'train_samples_per_second': 4.09, 'train_steps_per_second': 0.128, 'train_loss': 0.6153274965286255, 'epoch': 1.0}
36
+ ***** train metrics *****
37
+ epoch = 1.0
38
+ train_loss = 0.6153
39
+ train_runtime = 0:13:02.39
40
+ train_samples_per_second = 4.09
41
+ train_steps_per_second = 0.128
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 1.05,
3
- "train_loss": 0.041942973931630455,
4
- "train_runtime": 33.8193,
5
- "train_samples_per_second": 18.924,
6
- "train_steps_per_second": 0.591
7
  }
 
1
  {
2
+ "epoch": 1.0,
3
+ "train_loss": 0.6153274965286255,
4
+ "train_runtime": 782.3972,
5
+ "train_samples_per_second": 4.09,
6
+ "train_steps_per_second": 0.128
7
  }
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 75.27472527472527,
3
- "best_model_checkpoint": "./checkpoint-20",
4
- "epoch": 1.05,
5
- "global_step": 21,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -38,18 +38,138 @@
38
  "step": 20
39
  },
40
  {
41
- "epoch": 1.05,
42
- "step": 21,
43
- "total_flos": 1.654389080064e+16,
44
- "train_loss": 0.041942973931630455,
45
- "train_runtime": 33.8193,
46
- "train_samples_per_second": 18.924,
47
- "train_steps_per_second": 0.591
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
48
  }
49
  ],
50
- "max_steps": 20,
51
  "num_train_epochs": 9223372036854775807,
52
- "total_flos": 1.654389080064e+16,
53
  "trial_name": null,
54
  "trial_params": null
55
  }
 
1
  {
2
+ "best_metric": 60.43956043956044,
3
+ "best_model_checkpoint": "./checkpoint-70",
4
+ "epoch": 1.0,
5
+ "global_step": 100,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
38
  "step": 20
39
  },
40
  {
41
+ "epoch": 0.3,
42
+ "learning_rate": 7.68421052631579e-05,
43
+ "loss": 0.9934,
44
+ "step": 30
45
+ },
46
+ {
47
+ "epoch": 0.3,
48
+ "eval_loss": 0.811407208442688,
49
+ "eval_runtime": 17.9554,
50
+ "eval_samples_per_second": 3.564,
51
+ "eval_steps_per_second": 0.111,
52
+ "eval_wer": 72.16117216117216,
53
+ "step": 30
54
+ },
55
+ {
56
+ "epoch": 0.4,
57
+ "learning_rate": 6.631578947368421e-05,
58
+ "loss": 0.9568,
59
+ "step": 40
60
+ },
61
+ {
62
+ "epoch": 0.4,
63
+ "eval_loss": 0.7814445495605469,
64
+ "eval_runtime": 44.1521,
65
+ "eval_samples_per_second": 1.45,
66
+ "eval_steps_per_second": 0.045,
67
+ "eval_wer": 72.7106227106227,
68
+ "step": 40
69
+ },
70
+ {
71
+ "epoch": 0.5,
72
+ "learning_rate": 5.5789473684210526e-05,
73
+ "loss": 0.6856,
74
+ "step": 50
75
+ },
76
+ {
77
+ "epoch": 0.5,
78
+ "eval_loss": 0.7517387866973877,
79
+ "eval_runtime": 19.7741,
80
+ "eval_samples_per_second": 3.237,
81
+ "eval_steps_per_second": 0.101,
82
+ "eval_wer": 76.92307692307693,
83
+ "step": 50
84
+ },
85
+ {
86
+ "epoch": 0.6,
87
+ "learning_rate": 4.5263157894736846e-05,
88
+ "loss": 0.7808,
89
+ "step": 60
90
+ },
91
+ {
92
+ "epoch": 0.6,
93
+ "eval_loss": 0.6514347195625305,
94
+ "eval_runtime": 19.745,
95
+ "eval_samples_per_second": 3.241,
96
+ "eval_steps_per_second": 0.101,
97
+ "eval_wer": 63.55311355311355,
98
+ "step": 60
99
+ },
100
+ {
101
+ "epoch": 0.7,
102
+ "learning_rate": 3.473684210526316e-05,
103
+ "loss": 0.6826,
104
+ "step": 70
105
+ },
106
+ {
107
+ "epoch": 0.7,
108
+ "eval_loss": 0.6197173595428467,
109
+ "eval_runtime": 19.7014,
110
+ "eval_samples_per_second": 3.248,
111
+ "eval_steps_per_second": 0.102,
112
+ "eval_wer": 60.43956043956044,
113
+ "step": 70
114
+ },
115
+ {
116
+ "epoch": 0.8,
117
+ "learning_rate": 2.4210526315789474e-05,
118
+ "loss": 0.7832,
119
+ "step": 80
120
+ },
121
+ {
122
+ "epoch": 0.8,
123
+ "eval_loss": 0.6129069328308105,
124
+ "eval_runtime": 18.9507,
125
+ "eval_samples_per_second": 3.377,
126
+ "eval_steps_per_second": 0.106,
127
+ "eval_wer": 65.93406593406593,
128
+ "step": 80
129
+ },
130
+ {
131
+ "epoch": 0.9,
132
+ "learning_rate": 1.3684210526315791e-05,
133
+ "loss": 0.6031,
134
+ "step": 90
135
+ },
136
+ {
137
+ "epoch": 0.9,
138
+ "eval_loss": 0.5876654982566833,
139
+ "eval_runtime": 20.4075,
140
+ "eval_samples_per_second": 3.136,
141
+ "eval_steps_per_second": 0.098,
142
+ "eval_wer": 61.35531135531136,
143
+ "step": 90
144
+ },
145
+ {
146
+ "epoch": 1.0,
147
+ "learning_rate": 3.1578947368421056e-06,
148
+ "loss": 0.6678,
149
+ "step": 100
150
+ },
151
+ {
152
+ "epoch": 1.0,
153
+ "eval_loss": 0.5758526921272278,
154
+ "eval_runtime": 19.5593,
155
+ "eval_samples_per_second": 3.272,
156
+ "eval_steps_per_second": 0.102,
157
+ "eval_wer": 61.53846153846154,
158
+ "step": 100
159
+ },
160
+ {
161
+ "epoch": 1.0,
162
+ "step": 100,
163
+ "total_flos": 7.8780432384e+16,
164
+ "train_loss": 0.6153274965286255,
165
+ "train_runtime": 782.3972,
166
+ "train_samples_per_second": 4.09,
167
+ "train_steps_per_second": 0.128
168
  }
169
  ],
170
+ "max_steps": 100,
171
  "num_train_epochs": 9223372036854775807,
172
+ "total_flos": 7.8780432384e+16,
173
  "trial_name": null,
174
  "trial_params": null
175
  }