Upload folder using huggingface_hub

#3
by michaelsh - opened
Files changed (4) hide show
  1. optimizer.pt +1 -1
  2. pytorch_model.bin +1 -1
  3. trainer_state.json +77 -29
  4. training_args.bin +1 -1
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4601382e37ca15b9060d170a50d1ce572d6e3ffde3be7fc76354d533f3101faa
3
  size 302183045
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce7ec66048f0a6dbe35016acc67dbf341024e5dae5f14d6429219b36382cf6f5
3
  size 302183045
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2aceaf170565b15f68cf16576729c9d98a02f1b0bf1178bc349a1e8bcb501ba5
3
  size 151099049
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0099691db067fe152ea4f9295dfb3c6f98492b719fa87d0c05f8b9ab3e237107
3
  size 151099049
trainer_state.json CHANGED
@@ -9,28 +9,46 @@
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
- "eval_loss": 1.5109972953796387,
13
- "eval_runtime": 39.8139,
14
- "eval_samples_per_second": 2.688,
15
- "eval_steps_per_second": 0.176,
 
 
 
 
 
 
16
  "eval_wer": 0.7574039067422811,
17
  "eval_wer_ortho": 0.8027704485488126,
18
  "step": 29
19
  },
20
  {
21
  "epoch": 2.0,
22
- "eval_loss": 0.5695223808288574,
23
- "eval_runtime": 34.2898,
24
- "eval_samples_per_second": 3.12,
25
- "eval_steps_per_second": 0.204,
 
 
 
 
 
 
26
  "eval_wer": 0.43163201008191554,
27
  "eval_wer_ortho": 0.4346965699208443,
28
  "step": 58
29
  },
30
  {
31
  "epoch": 3.0,
32
- "eval_loss": 0.5170513987541199,
33
- "eval_runtime": 33.1576,
 
 
 
 
 
 
34
  "eval_samples_per_second": 3.227,
35
  "eval_steps_per_second": 0.211,
36
  "eval_wer": 0.391304347826087,
@@ -39,39 +57,63 @@
39
  },
40
  {
41
  "epoch": 4.0,
42
- "eval_loss": 0.5165203213691711,
43
- "eval_runtime": 33.1994,
44
- "eval_samples_per_second": 3.223,
45
- "eval_steps_per_second": 0.211,
 
 
 
 
 
 
46
  "eval_wer": 0.3906742281033396,
47
  "eval_wer_ortho": 0.39116094986807387,
48
  "step": 116
49
  },
50
  {
51
  "epoch": 5.0,
52
- "eval_loss": 0.5296039581298828,
53
- "eval_runtime": 33.4623,
54
- "eval_samples_per_second": 3.198,
55
- "eval_steps_per_second": 0.209,
 
 
 
 
 
 
56
  "eval_wer": 0.38248267170762446,
57
  "eval_wer_ortho": 0.38192612137203164,
58
  "step": 145
59
  },
60
  {
61
  "epoch": 6.0,
62
- "eval_loss": 0.5532421469688416,
63
- "eval_runtime": 33.084,
64
- "eval_samples_per_second": 3.234,
65
- "eval_steps_per_second": 0.212,
 
 
 
 
 
 
66
  "eval_wer": 0.37366099558916194,
67
  "eval_wer_ortho": 0.37467018469656993,
68
  "step": 174
69
  },
70
  {
71
  "epoch": 7.0,
72
- "eval_loss": 0.5614312887191772,
73
- "eval_runtime": 33.2048,
74
- "eval_samples_per_second": 3.222,
 
 
 
 
 
 
75
  "eval_steps_per_second": 0.211,
76
  "eval_wer": 0.38815374921235035,
77
  "eval_wer_ortho": 0.3865435356200528,
@@ -79,10 +121,16 @@
79
  },
80
  {
81
  "epoch": 8.0,
82
- "eval_loss": 0.6009427309036255,
83
- "eval_runtime": 34.1493,
84
- "eval_samples_per_second": 3.133,
85
- "eval_steps_per_second": 0.205,
 
 
 
 
 
 
86
  "eval_wer": 0.36546943919344677,
87
  "eval_wer_ortho": 0.3627968337730871,
88
  "step": 232
 
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
+ "learning_rate": 1e-05,
13
+ "loss": 3.1128,
14
+ "step": 29
15
+ },
16
+ {
17
+ "epoch": 1.0,
18
+ "eval_loss": 1.5109970569610596,
19
+ "eval_runtime": 39.2215,
20
+ "eval_samples_per_second": 2.728,
21
+ "eval_steps_per_second": 0.178,
22
  "eval_wer": 0.7574039067422811,
23
  "eval_wer_ortho": 0.8027704485488126,
24
  "step": 29
25
  },
26
  {
27
  "epoch": 2.0,
28
+ "learning_rate": 1e-05,
29
+ "loss": 0.6583,
30
+ "step": 58
31
+ },
32
+ {
33
+ "epoch": 2.0,
34
+ "eval_loss": 0.569522500038147,
35
+ "eval_runtime": 33.882,
36
+ "eval_samples_per_second": 3.158,
37
+ "eval_steps_per_second": 0.207,
38
  "eval_wer": 0.43163201008191554,
39
  "eval_wer_ortho": 0.4346965699208443,
40
  "step": 58
41
  },
42
  {
43
  "epoch": 3.0,
44
+ "learning_rate": 1e-05,
45
+ "loss": 0.3271,
46
+ "step": 87
47
+ },
48
+ {
49
+ "epoch": 3.0,
50
+ "eval_loss": 0.5170509219169617,
51
+ "eval_runtime": 33.1578,
52
  "eval_samples_per_second": 3.227,
53
  "eval_steps_per_second": 0.211,
54
  "eval_wer": 0.391304347826087,
 
57
  },
58
  {
59
  "epoch": 4.0,
60
+ "learning_rate": 1e-05,
61
+ "loss": 0.2003,
62
+ "step": 116
63
+ },
64
+ {
65
+ "epoch": 4.0,
66
+ "eval_loss": 0.5165189504623413,
67
+ "eval_runtime": 33.0788,
68
+ "eval_samples_per_second": 3.235,
69
+ "eval_steps_per_second": 0.212,
70
  "eval_wer": 0.3906742281033396,
71
  "eval_wer_ortho": 0.39116094986807387,
72
  "step": 116
73
  },
74
  {
75
  "epoch": 5.0,
76
+ "learning_rate": 1e-05,
77
+ "loss": 0.1189,
78
+ "step": 145
79
+ },
80
+ {
81
+ "epoch": 5.0,
82
+ "eval_loss": 0.5296050906181335,
83
+ "eval_runtime": 33.2182,
84
+ "eval_samples_per_second": 3.221,
85
+ "eval_steps_per_second": 0.211,
86
  "eval_wer": 0.38248267170762446,
87
  "eval_wer_ortho": 0.38192612137203164,
88
  "step": 145
89
  },
90
  {
91
  "epoch": 6.0,
92
+ "learning_rate": 1e-05,
93
+ "loss": 0.0623,
94
+ "step": 174
95
+ },
96
+ {
97
+ "epoch": 6.0,
98
+ "eval_loss": 0.553246021270752,
99
+ "eval_runtime": 33.3882,
100
+ "eval_samples_per_second": 3.205,
101
+ "eval_steps_per_second": 0.21,
102
  "eval_wer": 0.37366099558916194,
103
  "eval_wer_ortho": 0.37467018469656993,
104
  "step": 174
105
  },
106
  {
107
  "epoch": 7.0,
108
+ "learning_rate": 1e-05,
109
+ "loss": 0.0326,
110
+ "step": 203
111
+ },
112
+ {
113
+ "epoch": 7.0,
114
+ "eval_loss": 0.5614295601844788,
115
+ "eval_runtime": 33.1777,
116
+ "eval_samples_per_second": 3.225,
117
  "eval_steps_per_second": 0.211,
118
  "eval_wer": 0.38815374921235035,
119
  "eval_wer_ortho": 0.3865435356200528,
 
121
  },
122
  {
123
  "epoch": 8.0,
124
+ "learning_rate": 1e-05,
125
+ "loss": 0.0149,
126
+ "step": 232
127
+ },
128
+ {
129
+ "epoch": 8.0,
130
+ "eval_loss": 0.6009227633476257,
131
+ "eval_runtime": 33.313,
132
+ "eval_samples_per_second": 3.212,
133
+ "eval_steps_per_second": 0.21,
134
  "eval_wer": 0.36546943919344677,
135
  "eval_wer_ortho": 0.3627968337730871,
136
  "step": 232
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:081a84ed2977aff43516b2448a4decafc69047f8b0537bc45625f2b4d4d49ff5
3
  size 4155
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bcaa651a0a8b268e2d17fe0d8d04a867832736edf6f51740cb2f6ba3a317d63
3
  size 4155