pavitemple committed on
Commit
b704cd0
·
1 Parent(s): e932f1b

End of training

Browse files
Files changed (3) hide show
  1. all_results.json +8 -0
  2. test_results.json +8 -0
  3. trainer_state.json +172 -0
all_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 7.07,
3
+ "eval_accuracy": 0.5161290322580645,
4
+ "eval_loss": 1.0765262842178345,
5
+ "eval_runtime": 74.2165,
6
+ "eval_samples_per_second": 0.418,
7
+ "eval_steps_per_second": 0.108
8
+ }
test_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 7.07,
3
+ "eval_accuracy": 0.5161290322580645,
4
+ "eval_loss": 1.0765262842178345,
5
+ "eval_runtime": 74.2165,
6
+ "eval_samples_per_second": 0.418,
7
+ "eval_steps_per_second": 0.108
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,172 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.56,
3
+ "best_model_checkpoint": "finetuned-Accident-Video-subset/checkpoint-84",
4
+ "epoch": 7.066666666666666,
5
+ "eval_steps": 500,
6
+ "global_step": 90,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.11,
13
+ "learning_rate": 4.938271604938271e-05,
14
+ "loss": 1.5898,
15
+ "step": 10
16
+ },
17
+ {
18
+ "epoch": 0.13,
19
+ "eval_accuracy": 0.48,
20
+ "eval_loss": 1.317312479019165,
21
+ "eval_runtime": 78.1417,
22
+ "eval_samples_per_second": 0.32,
23
+ "eval_steps_per_second": 0.09,
24
+ "step": 12
25
+ },
26
+ {
27
+ "epoch": 1.09,
28
+ "learning_rate": 4.3209876543209875e-05,
29
+ "loss": 1.2104,
30
+ "step": 20
31
+ },
32
+ {
33
+ "epoch": 1.13,
34
+ "eval_accuracy": 0.4,
35
+ "eval_loss": 1.2156548500061035,
36
+ "eval_runtime": 75.0252,
37
+ "eval_samples_per_second": 0.333,
38
+ "eval_steps_per_second": 0.093,
39
+ "step": 24
40
+ },
41
+ {
42
+ "epoch": 2.07,
43
+ "learning_rate": 3.7037037037037037e-05,
44
+ "loss": 1.418,
45
+ "step": 30
46
+ },
47
+ {
48
+ "epoch": 2.13,
49
+ "eval_accuracy": 0.52,
50
+ "eval_loss": 1.1616722345352173,
51
+ "eval_runtime": 75.4314,
52
+ "eval_samples_per_second": 0.331,
53
+ "eval_steps_per_second": 0.093,
54
+ "step": 36
55
+ },
56
+ {
57
+ "epoch": 3.04,
58
+ "learning_rate": 3.08641975308642e-05,
59
+ "loss": 1.1202,
60
+ "step": 40
61
+ },
62
+ {
63
+ "epoch": 3.13,
64
+ "eval_accuracy": 0.52,
65
+ "eval_loss": 1.1278761625289917,
66
+ "eval_runtime": 70.2254,
67
+ "eval_samples_per_second": 0.356,
68
+ "eval_steps_per_second": 0.1,
69
+ "step": 48
70
+ },
71
+ {
72
+ "epoch": 4.02,
73
+ "learning_rate": 2.4691358024691357e-05,
74
+ "loss": 1.0015,
75
+ "step": 50
76
+ },
77
+ {
78
+ "epoch": 4.13,
79
+ "learning_rate": 1.8518518518518518e-05,
80
+ "loss": 1.2226,
81
+ "step": 60
82
+ },
83
+ {
84
+ "epoch": 4.13,
85
+ "eval_accuracy": 0.48,
86
+ "eval_loss": 1.1110718250274658,
87
+ "eval_runtime": 59.6068,
88
+ "eval_samples_per_second": 0.419,
89
+ "eval_steps_per_second": 0.117,
90
+ "step": 60
91
+ },
92
+ {
93
+ "epoch": 5.11,
94
+ "learning_rate": 1.2345679012345678e-05,
95
+ "loss": 1.1886,
96
+ "step": 70
97
+ },
98
+ {
99
+ "epoch": 5.13,
100
+ "eval_accuracy": 0.48,
101
+ "eval_loss": 1.072799801826477,
102
+ "eval_runtime": 59.8468,
103
+ "eval_samples_per_second": 0.418,
104
+ "eval_steps_per_second": 0.117,
105
+ "step": 72
106
+ },
107
+ {
108
+ "epoch": 6.09,
109
+ "learning_rate": 6.172839506172839e-06,
110
+ "loss": 1.0177,
111
+ "step": 80
112
+ },
113
+ {
114
+ "epoch": 6.13,
115
+ "eval_accuracy": 0.56,
116
+ "eval_loss": 1.0452561378479004,
117
+ "eval_runtime": 60.7954,
118
+ "eval_samples_per_second": 0.411,
119
+ "eval_steps_per_second": 0.115,
120
+ "step": 84
121
+ },
122
+ {
123
+ "epoch": 7.07,
124
+ "learning_rate": 0.0,
125
+ "loss": 1.0443,
126
+ "step": 90
127
+ },
128
+ {
129
+ "epoch": 7.07,
130
+ "eval_accuracy": 0.56,
131
+ "eval_loss": 1.0377601385116577,
132
+ "eval_runtime": 70.0346,
133
+ "eval_samples_per_second": 0.357,
134
+ "eval_steps_per_second": 0.1,
135
+ "step": 90
136
+ },
137
+ {
138
+ "epoch": 7.07,
139
+ "step": 90,
140
+ "total_flos": 4.2242719732383744e+17,
141
+ "train_loss": 1.2014519691467285,
142
+ "train_runtime": 1824.3873,
143
+ "train_samples_per_second": 0.197,
144
+ "train_steps_per_second": 0.049
145
+ },
146
+ {
147
+ "epoch": 7.07,
148
+ "eval_accuracy": 0.5161290322580645,
149
+ "eval_loss": 1.0765262842178345,
150
+ "eval_runtime": 82.8746,
151
+ "eval_samples_per_second": 0.374,
152
+ "eval_steps_per_second": 0.097,
153
+ "step": 90
154
+ },
155
+ {
156
+ "epoch": 7.07,
157
+ "eval_accuracy": 0.5161290322580645,
158
+ "eval_loss": 1.0765262842178345,
159
+ "eval_runtime": 74.2165,
160
+ "eval_samples_per_second": 0.418,
161
+ "eval_steps_per_second": 0.108,
162
+ "step": 90
163
+ }
164
+ ],
165
+ "logging_steps": 10,
166
+ "max_steps": 90,
167
+ "num_train_epochs": 9223372036854775807,
168
+ "save_steps": 500,
169
+ "total_flos": 4.2242719732383744e+17,
170
+ "trial_name": null,
171
+ "trial_params": null
172
+ }