merve HF Staff commited on
Commit
1741198
·
verified ·
1 Parent(s): cff5e6d

End of training

Browse files
Files changed (5) hide show
  1. README.md +24 -22
  2. all_results.json +32 -0
  3. eval_results.json +27 -0
  4. train_results.json +8 -0
  5. trainer_state.json +1583 -0
README.md CHANGED
@@ -3,6 +3,8 @@ library_name: transformers
3
  license: apache-2.0
4
  base_model: PekingU/rtdetr_v2_r18vd
5
  tags:
 
 
6
  - generated_from_trainer
7
  model-index:
8
  - name: mobile-ui-rtdetrv2
@@ -14,29 +16,29 @@ should probably proofread and complete it, then remove this comment. -->
14
 
15
  # mobile-ui-rtdetrv2
16
 
17
- This model is a fine-tuned version of [PekingU/rtdetr_v2_r18vd](https://huggingface.co/PekingU/rtdetr_v2_r18vd) on an unknown dataset.
18
  It achieves the following results on the evaluation set:
19
- - Loss: 7.5326
20
- - Map: 0.1598
21
- - Map 50: 0.2221
22
- - Map 75: 0.1589
23
- - Map Small: 0.0793
24
- - Map Medium: 0.2358
25
- - Map Large: 0.3415
26
- - Mar 1: 0.0499
27
- - Mar 10: 0.2576
28
- - Mar 100: 0.4897
29
- - Mar Small: 0.2705
30
- - Mar Medium: 0.5899
31
- - Mar Large: 0.8065
32
- - Map Group: 0.1105
33
- - Mar 100 Group: 0.5388
34
- - Map Image: 0.2522
35
- - Mar 100 Image: 0.6149
36
- - Map Rectangle: 0.1861
37
- - Mar 100 Rectangle: 0.4594
38
- - Map Text: 0.0905
39
- - Mar 100 Text: 0.3458
40
 
41
  ## Model description
42
 
 
3
  license: apache-2.0
4
  base_model: PekingU/rtdetr_v2_r18vd
5
  tags:
6
+ - object-detection
7
+ - vision
8
  - generated_from_trainer
9
  model-index:
10
  - name: mobile-ui-rtdetrv2
 
16
 
17
  # mobile-ui-rtdetrv2
18
 
19
+ This model is a fine-tuned version of [PekingU/rtdetr_v2_r18vd](https://huggingface.co/PekingU/rtdetr_v2_r18vd) on the mrtoy/mobile-ui-design dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 7.5546
22
+ - Map: 0.1631
23
+ - Map 50: 0.2291
24
+ - Map 75: 0.1615
25
+ - Map Small: 0.0809
26
+ - Map Medium: 0.2384
27
+ - Map Large: 0.3418
28
+ - Mar 1: 0.0502
29
+ - Mar 10: 0.2617
30
+ - Mar 100: 0.4934
31
+ - Mar Small: 0.2801
32
+ - Mar Medium: 0.5902
33
+ - Mar Large: 0.7942
34
+ - Map Group: 0.1156
35
+ - Mar 100 Group: 0.5438
36
+ - Map Image: 0.2472
37
+ - Mar 100 Image: 0.6086
38
+ - Map Rectangle: 0.1883
39
+ - Mar 100 Rectangle: 0.458
40
+ - Map Text: 0.1014
41
+ - Mar 100 Text: 0.3633
42
 
43
  ## Model description
44
 
all_results.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 30.0,
3
+ "eval_loss": 7.554591178894043,
4
+ "eval_map": 0.1631,
5
+ "eval_map_50": 0.2291,
6
+ "eval_map_75": 0.1615,
7
+ "eval_map_group": 0.1156,
8
+ "eval_map_image": 0.2472,
9
+ "eval_map_large": 0.3418,
10
+ "eval_map_medium": 0.2384,
11
+ "eval_map_rectangle": 0.1883,
12
+ "eval_map_small": 0.0809,
13
+ "eval_map_text": 0.1014,
14
+ "eval_mar_1": 0.0502,
15
+ "eval_mar_10": 0.2617,
16
+ "eval_mar_100": 0.4934,
17
+ "eval_mar_100_group": 0.5438,
18
+ "eval_mar_100_image": 0.6086,
19
+ "eval_mar_100_rectangle": 0.458,
20
+ "eval_mar_100_text": 0.3633,
21
+ "eval_mar_large": 0.7942,
22
+ "eval_mar_medium": 0.5902,
23
+ "eval_mar_small": 0.2801,
24
+ "eval_runtime": 17.1307,
25
+ "eval_samples_per_second": 7.005,
26
+ "eval_steps_per_second": 0.876,
27
+ "total_flos": 2.95288818499584e+18,
28
+ "train_loss": 12.287477396404933,
29
+ "train_runtime": 1674.3599,
30
+ "train_samples_per_second": 11.915,
31
+ "train_steps_per_second": 1.505
32
+ }
eval_results.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 30.0,
3
+ "eval_loss": 7.554591178894043,
4
+ "eval_map": 0.1631,
5
+ "eval_map_50": 0.2291,
6
+ "eval_map_75": 0.1615,
7
+ "eval_map_group": 0.1156,
8
+ "eval_map_image": 0.2472,
9
+ "eval_map_large": 0.3418,
10
+ "eval_map_medium": 0.2384,
11
+ "eval_map_rectangle": 0.1883,
12
+ "eval_map_small": 0.0809,
13
+ "eval_map_text": 0.1014,
14
+ "eval_mar_1": 0.0502,
15
+ "eval_mar_10": 0.2617,
16
+ "eval_mar_100": 0.4934,
17
+ "eval_mar_100_group": 0.5438,
18
+ "eval_mar_100_image": 0.6086,
19
+ "eval_mar_100_rectangle": 0.458,
20
+ "eval_mar_100_text": 0.3633,
21
+ "eval_mar_large": 0.7942,
22
+ "eval_mar_medium": 0.5902,
23
+ "eval_mar_small": 0.2801,
24
+ "eval_runtime": 17.1307,
25
+ "eval_samples_per_second": 7.005,
26
+ "eval_steps_per_second": 0.876
27
+ }
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 30.0,
3
+ "total_flos": 2.95288818499584e+18,
4
+ "train_loss": 12.287477396404933,
5
+ "train_runtime": 1674.3599,
6
+ "train_samples_per_second": 11.915,
7
+ "train_steps_per_second": 1.505
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,1583 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": 1932,
3
+ "best_metric": 0.166,
4
+ "best_model_checkpoint": "mobile-ui-rtdetrv2/checkpoint-1932",
5
+ "epoch": 30.0,
6
+ "eval_steps": 500,
7
+ "global_step": 2520,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.2976190476190476,
14
+ "grad_norm": 33.42657470703125,
15
+ "learning_rate": 4.7619047619047615e-06,
16
+ "loss": 30.43977294921875,
17
+ "step": 25
18
+ },
19
+ {
20
+ "epoch": 0.5952380952380952,
21
+ "grad_norm": 19.833362579345703,
22
+ "learning_rate": 9.722222222222223e-06,
23
+ "loss": 26.7940478515625,
24
+ "step": 50
25
+ },
26
+ {
27
+ "epoch": 0.8928571428571429,
28
+ "grad_norm": 15.38772964477539,
29
+ "learning_rate": 1.4682539682539683e-05,
30
+ "loss": 22.560556640625,
31
+ "step": 75
32
+ },
33
+ {
34
+ "epoch": 1.0,
35
+ "eval_loss": 14.398598670959473,
36
+ "eval_map": 0.005,
37
+ "eval_map_50": 0.0119,
38
+ "eval_map_75": 0.0031,
39
+ "eval_map_group": 0.0113,
40
+ "eval_map_image": 0.0051,
41
+ "eval_map_large": 0.0154,
42
+ "eval_map_medium": 0.0061,
43
+ "eval_map_rectangle": 0.0031,
44
+ "eval_map_small": 0.0015,
45
+ "eval_map_text": 0.0006,
46
+ "eval_mar_1": 0.0056,
47
+ "eval_mar_10": 0.0315,
48
+ "eval_mar_100": 0.1098,
49
+ "eval_mar_100_group": 0.1591,
50
+ "eval_mar_100_image": 0.1275,
51
+ "eval_mar_100_rectangle": 0.1274,
52
+ "eval_mar_100_text": 0.0254,
53
+ "eval_mar_large": 0.2126,
54
+ "eval_mar_medium": 0.1272,
55
+ "eval_mar_small": 0.0351,
56
+ "eval_runtime": 19.2065,
57
+ "eval_samples_per_second": 6.248,
58
+ "eval_steps_per_second": 0.781,
59
+ "step": 84
60
+ },
61
+ {
62
+ "epoch": 1.1904761904761905,
63
+ "grad_norm": 40.03998947143555,
64
+ "learning_rate": 1.9642857142857145e-05,
65
+ "loss": 19.5402783203125,
66
+ "step": 100
67
+ },
68
+ {
69
+ "epoch": 1.4880952380952381,
70
+ "grad_norm": 10.218520164489746,
71
+ "learning_rate": 2.4603174603174602e-05,
72
+ "loss": 18.0630078125,
73
+ "step": 125
74
+ },
75
+ {
76
+ "epoch": 1.7857142857142856,
77
+ "grad_norm": 9.290128707885742,
78
+ "learning_rate": 2.9563492063492066e-05,
79
+ "loss": 16.5726025390625,
80
+ "step": 150
81
+ },
82
+ {
83
+ "epoch": 2.0,
84
+ "eval_loss": 10.262517929077148,
85
+ "eval_map": 0.0774,
86
+ "eval_map_50": 0.1221,
87
+ "eval_map_75": 0.0758,
88
+ "eval_map_group": 0.0806,
89
+ "eval_map_image": 0.1143,
90
+ "eval_map_large": 0.1336,
91
+ "eval_map_medium": 0.0946,
92
+ "eval_map_rectangle": 0.0612,
93
+ "eval_map_small": 0.0293,
94
+ "eval_map_text": 0.0535,
95
+ "eval_mar_1": 0.041,
96
+ "eval_mar_10": 0.1849,
97
+ "eval_mar_100": 0.3597,
98
+ "eval_mar_100_group": 0.3638,
99
+ "eval_mar_100_image": 0.4799,
100
+ "eval_mar_100_rectangle": 0.362,
101
+ "eval_mar_100_text": 0.2332,
102
+ "eval_mar_large": 0.5727,
103
+ "eval_mar_medium": 0.431,
104
+ "eval_mar_small": 0.1654,
105
+ "eval_runtime": 17.3736,
106
+ "eval_samples_per_second": 6.907,
107
+ "eval_steps_per_second": 0.863,
108
+ "step": 168
109
+ },
110
+ {
111
+ "epoch": 2.0833333333333335,
112
+ "grad_norm": 7.967964172363281,
113
+ "learning_rate": 3.4523809523809526e-05,
114
+ "loss": 15.704903564453126,
115
+ "step": 175
116
+ },
117
+ {
118
+ "epoch": 2.380952380952381,
119
+ "grad_norm": 14.558771133422852,
120
+ "learning_rate": 3.9484126984126986e-05,
121
+ "loss": 14.5267236328125,
122
+ "step": 200
123
+ },
124
+ {
125
+ "epoch": 2.678571428571429,
126
+ "grad_norm": 9.619315147399902,
127
+ "learning_rate": 4.4444444444444447e-05,
128
+ "loss": 13.92162353515625,
129
+ "step": 225
130
+ },
131
+ {
132
+ "epoch": 2.9761904761904763,
133
+ "grad_norm": 8.275788307189941,
134
+ "learning_rate": 4.940476190476191e-05,
135
+ "loss": 13.8275439453125,
136
+ "step": 250
137
+ },
138
+ {
139
+ "epoch": 3.0,
140
+ "eval_loss": 8.35128116607666,
141
+ "eval_map": 0.1082,
142
+ "eval_map_50": 0.1593,
143
+ "eval_map_75": 0.1049,
144
+ "eval_map_group": 0.0831,
145
+ "eval_map_image": 0.1796,
146
+ "eval_map_large": 0.2034,
147
+ "eval_map_medium": 0.1423,
148
+ "eval_map_rectangle": 0.1099,
149
+ "eval_map_small": 0.0428,
150
+ "eval_map_text": 0.0602,
151
+ "eval_mar_1": 0.0448,
152
+ "eval_mar_10": 0.1995,
153
+ "eval_mar_100": 0.4293,
154
+ "eval_mar_100_group": 0.4094,
155
+ "eval_mar_100_image": 0.5438,
156
+ "eval_mar_100_rectangle": 0.4053,
157
+ "eval_mar_100_text": 0.3589,
158
+ "eval_mar_large": 0.6945,
159
+ "eval_mar_medium": 0.4812,
160
+ "eval_mar_small": 0.2377,
161
+ "eval_runtime": 17.5818,
162
+ "eval_samples_per_second": 6.825,
163
+ "eval_steps_per_second": 0.853,
164
+ "step": 252
165
+ },
166
+ {
167
+ "epoch": 3.2738095238095237,
168
+ "grad_norm": 17.83608055114746,
169
+ "learning_rate": 4.951499118165785e-05,
170
+ "loss": 13.419459228515626,
171
+ "step": 275
172
+ },
173
+ {
174
+ "epoch": 3.571428571428571,
175
+ "grad_norm": 15.467687606811523,
176
+ "learning_rate": 4.8963844797178134e-05,
177
+ "loss": 13.36093994140625,
178
+ "step": 300
179
+ },
180
+ {
181
+ "epoch": 3.869047619047619,
182
+ "grad_norm": 6.873251438140869,
183
+ "learning_rate": 4.841269841269841e-05,
184
+ "loss": 12.94340576171875,
185
+ "step": 325
186
+ },
187
+ {
188
+ "epoch": 4.0,
189
+ "eval_loss": 8.083844184875488,
190
+ "eval_map": 0.1171,
191
+ "eval_map_50": 0.1741,
192
+ "eval_map_75": 0.1167,
193
+ "eval_map_group": 0.064,
194
+ "eval_map_image": 0.2013,
195
+ "eval_map_large": 0.2186,
196
+ "eval_map_medium": 0.1593,
197
+ "eval_map_rectangle": 0.1426,
198
+ "eval_map_small": 0.0463,
199
+ "eval_map_text": 0.0604,
200
+ "eval_mar_1": 0.0411,
201
+ "eval_mar_10": 0.2116,
202
+ "eval_mar_100": 0.4439,
203
+ "eval_mar_100_group": 0.4459,
204
+ "eval_mar_100_image": 0.5678,
205
+ "eval_mar_100_rectangle": 0.4243,
206
+ "eval_mar_100_text": 0.3375,
207
+ "eval_mar_large": 0.7398,
208
+ "eval_mar_medium": 0.5069,
209
+ "eval_mar_small": 0.2457,
210
+ "eval_runtime": 18.0359,
211
+ "eval_samples_per_second": 6.653,
212
+ "eval_steps_per_second": 0.832,
213
+ "step": 336
214
+ },
215
+ {
216
+ "epoch": 4.166666666666667,
217
+ "grad_norm": 14.644241333007812,
218
+ "learning_rate": 4.78615520282187e-05,
219
+ "loss": 12.36754150390625,
220
+ "step": 350
221
+ },
222
+ {
223
+ "epoch": 4.464285714285714,
224
+ "grad_norm": 9.411576271057129,
225
+ "learning_rate": 4.731040564373898e-05,
226
+ "loss": 12.7791748046875,
227
+ "step": 375
228
+ },
229
+ {
230
+ "epoch": 4.761904761904762,
231
+ "grad_norm": 14.686434745788574,
232
+ "learning_rate": 4.675925925925926e-05,
233
+ "loss": 12.952034912109376,
234
+ "step": 400
235
+ },
236
+ {
237
+ "epoch": 5.0,
238
+ "eval_loss": 7.995185375213623,
239
+ "eval_map": 0.1284,
240
+ "eval_map_50": 0.1931,
241
+ "eval_map_75": 0.1248,
242
+ "eval_map_group": 0.0539,
243
+ "eval_map_image": 0.2066,
244
+ "eval_map_large": 0.2224,
245
+ "eval_map_medium": 0.1772,
246
+ "eval_map_rectangle": 0.1552,
247
+ "eval_map_small": 0.06,
248
+ "eval_map_text": 0.0978,
249
+ "eval_mar_1": 0.0435,
250
+ "eval_mar_10": 0.2236,
251
+ "eval_mar_100": 0.4568,
252
+ "eval_mar_100_group": 0.4465,
253
+ "eval_mar_100_image": 0.558,
254
+ "eval_mar_100_rectangle": 0.4388,
255
+ "eval_mar_100_text": 0.384,
256
+ "eval_mar_large": 0.7415,
257
+ "eval_mar_medium": 0.5216,
258
+ "eval_mar_small": 0.2552,
259
+ "eval_runtime": 17.6743,
260
+ "eval_samples_per_second": 6.79,
261
+ "eval_steps_per_second": 0.849,
262
+ "step": 420
263
+ },
264
+ {
265
+ "epoch": 5.059523809523809,
266
+ "grad_norm": 14.872081756591797,
267
+ "learning_rate": 4.620811287477954e-05,
268
+ "loss": 12.8186669921875,
269
+ "step": 425
270
+ },
271
+ {
272
+ "epoch": 5.357142857142857,
273
+ "grad_norm": 14.947751998901367,
274
+ "learning_rate": 4.5656966490299825e-05,
275
+ "loss": 12.421568603515626,
276
+ "step": 450
277
+ },
278
+ {
279
+ "epoch": 5.654761904761905,
280
+ "grad_norm": 14.387224197387695,
281
+ "learning_rate": 4.510582010582011e-05,
282
+ "loss": 12.860526123046874,
283
+ "step": 475
284
+ },
285
+ {
286
+ "epoch": 5.9523809523809526,
287
+ "grad_norm": 11.880175590515137,
288
+ "learning_rate": 4.455467372134039e-05,
289
+ "loss": 12.392239990234375,
290
+ "step": 500
291
+ },
292
+ {
293
+ "epoch": 6.0,
294
+ "eval_loss": 7.908458232879639,
295
+ "eval_map": 0.123,
296
+ "eval_map_50": 0.18,
297
+ "eval_map_75": 0.1191,
298
+ "eval_map_group": 0.0441,
299
+ "eval_map_image": 0.2175,
300
+ "eval_map_large": 0.2555,
301
+ "eval_map_medium": 0.175,
302
+ "eval_map_rectangle": 0.1501,
303
+ "eval_map_small": 0.0541,
304
+ "eval_map_text": 0.0801,
305
+ "eval_mar_1": 0.0432,
306
+ "eval_mar_10": 0.2122,
307
+ "eval_mar_100": 0.4464,
308
+ "eval_mar_100_group": 0.4276,
309
+ "eval_mar_100_image": 0.588,
310
+ "eval_mar_100_rectangle": 0.4424,
311
+ "eval_mar_100_text": 0.3274,
312
+ "eval_mar_large": 0.7738,
313
+ "eval_mar_medium": 0.5237,
314
+ "eval_mar_small": 0.2375,
315
+ "eval_runtime": 17.6011,
316
+ "eval_samples_per_second": 6.818,
317
+ "eval_steps_per_second": 0.852,
318
+ "step": 504
319
+ },
320
+ {
321
+ "epoch": 6.25,
322
+ "grad_norm": 24.597919464111328,
323
+ "learning_rate": 4.400352733686067e-05,
324
+ "loss": 12.41754150390625,
325
+ "step": 525
326
+ },
327
+ {
328
+ "epoch": 6.5476190476190474,
329
+ "grad_norm": 11.277619361877441,
330
+ "learning_rate": 4.345238095238096e-05,
331
+ "loss": 12.266273193359375,
332
+ "step": 550
333
+ },
334
+ {
335
+ "epoch": 6.845238095238095,
336
+ "grad_norm": 36.6771354675293,
337
+ "learning_rate": 4.290123456790124e-05,
338
+ "loss": 11.820712890625,
339
+ "step": 575
340
+ },
341
+ {
342
+ "epoch": 7.0,
343
+ "eval_loss": 7.85192346572876,
344
+ "eval_map": 0.1266,
345
+ "eval_map_50": 0.1846,
346
+ "eval_map_75": 0.1225,
347
+ "eval_map_group": 0.0519,
348
+ "eval_map_image": 0.2088,
349
+ "eval_map_large": 0.2261,
350
+ "eval_map_medium": 0.1858,
351
+ "eval_map_rectangle": 0.1674,
352
+ "eval_map_small": 0.0571,
353
+ "eval_map_text": 0.0785,
354
+ "eval_mar_1": 0.043,
355
+ "eval_mar_10": 0.2199,
356
+ "eval_mar_100": 0.4571,
357
+ "eval_mar_100_group": 0.4622,
358
+ "eval_mar_100_image": 0.5641,
359
+ "eval_mar_100_rectangle": 0.4543,
360
+ "eval_mar_100_text": 0.3479,
361
+ "eval_mar_large": 0.7813,
362
+ "eval_mar_medium": 0.5405,
363
+ "eval_mar_small": 0.2422,
364
+ "eval_runtime": 17.7165,
365
+ "eval_samples_per_second": 6.773,
366
+ "eval_steps_per_second": 0.847,
367
+ "step": 588
368
+ },
369
+ {
370
+ "epoch": 7.142857142857143,
371
+ "grad_norm": 20.0545711517334,
372
+ "learning_rate": 4.235008818342152e-05,
373
+ "loss": 12.802718505859374,
374
+ "step": 600
375
+ },
376
+ {
377
+ "epoch": 7.440476190476191,
378
+ "grad_norm": 15.03058910369873,
379
+ "learning_rate": 4.17989417989418e-05,
380
+ "loss": 12.179630126953125,
381
+ "step": 625
382
+ },
383
+ {
384
+ "epoch": 7.738095238095238,
385
+ "grad_norm": 7.166962623596191,
386
+ "learning_rate": 4.124779541446208e-05,
387
+ "loss": 11.9717578125,
388
+ "step": 650
389
+ },
390
+ {
391
+ "epoch": 8.0,
392
+ "eval_loss": 7.762953281402588,
393
+ "eval_map": 0.1389,
394
+ "eval_map_50": 0.2028,
395
+ "eval_map_75": 0.1353,
396
+ "eval_map_group": 0.0552,
397
+ "eval_map_image": 0.2193,
398
+ "eval_map_large": 0.2511,
399
+ "eval_map_medium": 0.197,
400
+ "eval_map_rectangle": 0.177,
401
+ "eval_map_small": 0.066,
402
+ "eval_map_text": 0.1041,
403
+ "eval_mar_1": 0.0432,
404
+ "eval_mar_10": 0.2317,
405
+ "eval_mar_100": 0.4742,
406
+ "eval_mar_100_group": 0.4814,
407
+ "eval_mar_100_image": 0.5825,
408
+ "eval_mar_100_rectangle": 0.4582,
409
+ "eval_mar_100_text": 0.3747,
410
+ "eval_mar_large": 0.761,
411
+ "eval_mar_medium": 0.5526,
412
+ "eval_mar_small": 0.2631,
413
+ "eval_runtime": 17.6278,
414
+ "eval_samples_per_second": 6.807,
415
+ "eval_steps_per_second": 0.851,
416
+ "step": 672
417
+ },
418
+ {
419
+ "epoch": 8.035714285714286,
420
+ "grad_norm": 10.33957290649414,
421
+ "learning_rate": 4.0696649029982364e-05,
422
+ "loss": 11.71945556640625,
423
+ "step": 675
424
+ },
425
+ {
426
+ "epoch": 8.333333333333334,
427
+ "grad_norm": 11.141268730163574,
428
+ "learning_rate": 4.014550264550265e-05,
429
+ "loss": 12.104078369140625,
430
+ "step": 700
431
+ },
432
+ {
433
+ "epoch": 8.630952380952381,
434
+ "grad_norm": 8.50006103515625,
435
+ "learning_rate": 3.959435626102293e-05,
436
+ "loss": 12.10205322265625,
437
+ "step": 725
438
+ },
439
+ {
440
+ "epoch": 8.928571428571429,
441
+ "grad_norm": 12.563775062561035,
442
+ "learning_rate": 3.904320987654321e-05,
443
+ "loss": 11.8281201171875,
444
+ "step": 750
445
+ },
446
+ {
447
+ "epoch": 9.0,
448
+ "eval_loss": 7.723588466644287,
449
+ "eval_map": 0.1317,
450
+ "eval_map_50": 0.186,
451
+ "eval_map_75": 0.1298,
452
+ "eval_map_group": 0.0554,
453
+ "eval_map_image": 0.2197,
454
+ "eval_map_large": 0.2512,
455
+ "eval_map_medium": 0.1925,
456
+ "eval_map_rectangle": 0.1777,
457
+ "eval_map_small": 0.0607,
458
+ "eval_map_text": 0.0739,
459
+ "eval_mar_1": 0.043,
460
+ "eval_mar_10": 0.2254,
461
+ "eval_mar_100": 0.4671,
462
+ "eval_mar_100_group": 0.4945,
463
+ "eval_mar_100_image": 0.5935,
464
+ "eval_mar_100_rectangle": 0.4602,
465
+ "eval_mar_100_text": 0.32,
466
+ "eval_mar_large": 0.7856,
467
+ "eval_mar_medium": 0.5534,
468
+ "eval_mar_small": 0.2523,
469
+ "eval_runtime": 17.6923,
470
+ "eval_samples_per_second": 6.783,
471
+ "eval_steps_per_second": 0.848,
472
+ "step": 756
473
+ },
474
+ {
475
+ "epoch": 9.226190476190476,
476
+ "grad_norm": 15.43812370300293,
477
+ "learning_rate": 3.84920634920635e-05,
478
+ "loss": 11.588818359375,
479
+ "step": 775
480
+ },
481
+ {
482
+ "epoch": 9.523809523809524,
483
+ "grad_norm": 33.323638916015625,
484
+ "learning_rate": 3.794091710758378e-05,
485
+ "loss": 11.961219482421875,
486
+ "step": 800
487
+ },
488
+ {
489
+ "epoch": 9.821428571428571,
490
+ "grad_norm": 23.318923950195312,
491
+ "learning_rate": 3.7389770723104055e-05,
492
+ "loss": 11.79553955078125,
493
+ "step": 825
494
+ },
495
+ {
496
+ "epoch": 10.0,
497
+ "eval_loss": 7.686021327972412,
498
+ "eval_map": 0.1389,
499
+ "eval_map_50": 0.1989,
500
+ "eval_map_75": 0.1353,
501
+ "eval_map_group": 0.0604,
502
+ "eval_map_image": 0.2208,
503
+ "eval_map_large": 0.2665,
504
+ "eval_map_medium": 0.201,
505
+ "eval_map_rectangle": 0.1802,
506
+ "eval_map_small": 0.0685,
507
+ "eval_map_text": 0.0944,
508
+ "eval_mar_1": 0.0451,
509
+ "eval_mar_10": 0.2327,
510
+ "eval_mar_100": 0.4797,
511
+ "eval_mar_100_group": 0.506,
512
+ "eval_mar_100_image": 0.5941,
513
+ "eval_mar_100_rectangle": 0.4599,
514
+ "eval_mar_100_text": 0.359,
515
+ "eval_mar_large": 0.8045,
516
+ "eval_mar_medium": 0.568,
517
+ "eval_mar_small": 0.2633,
518
+ "eval_runtime": 17.2713,
519
+ "eval_samples_per_second": 6.948,
520
+ "eval_steps_per_second": 0.868,
521
+ "step": 840
522
+ },
523
+ {
524
+ "epoch": 10.119047619047619,
525
+ "grad_norm": 21.750789642333984,
526
+ "learning_rate": 3.683862433862434e-05,
527
+ "loss": 11.53491943359375,
528
+ "step": 850
529
+ },
530
+ {
531
+ "epoch": 10.416666666666666,
532
+ "grad_norm": 12.808640480041504,
533
+ "learning_rate": 3.628747795414462e-05,
534
+ "loss": 11.769920654296875,
535
+ "step": 875
536
+ },
537
+ {
538
+ "epoch": 10.714285714285714,
539
+ "grad_norm": 12.053258895874023,
540
+ "learning_rate": 3.5736331569664904e-05,
541
+ "loss": 11.778603515625,
542
+ "step": 900
543
+ },
544
+ {
545
+ "epoch": 11.0,
546
+ "eval_loss": 7.661948204040527,
547
+ "eval_map": 0.1456,
548
+ "eval_map_50": 0.2122,
549
+ "eval_map_75": 0.1431,
550
+ "eval_map_group": 0.0649,
551
+ "eval_map_image": 0.2302,
552
+ "eval_map_large": 0.2814,
553
+ "eval_map_medium": 0.2067,
554
+ "eval_map_rectangle": 0.1763,
555
+ "eval_map_small": 0.0763,
556
+ "eval_map_text": 0.1111,
557
+ "eval_mar_1": 0.0445,
558
+ "eval_mar_10": 0.2399,
559
+ "eval_mar_100": 0.4916,
560
+ "eval_mar_100_group": 0.5073,
561
+ "eval_mar_100_image": 0.6075,
562
+ "eval_mar_100_rectangle": 0.4558,
563
+ "eval_mar_100_text": 0.3955,
564
+ "eval_mar_large": 0.7904,
565
+ "eval_mar_medium": 0.5715,
566
+ "eval_mar_small": 0.2859,
567
+ "eval_runtime": 17.5947,
568
+ "eval_samples_per_second": 6.82,
569
+ "eval_steps_per_second": 0.853,
570
+ "step": 924
571
+ },
572
+ {
573
+ "epoch": 11.011904761904763,
574
+ "grad_norm": 10.250245094299316,
575
+ "learning_rate": 3.518518518518519e-05,
576
+ "loss": 12.0818701171875,
577
+ "step": 925
578
+ },
579
+ {
580
+ "epoch": 11.30952380952381,
581
+ "grad_norm": 28.736799240112305,
582
+ "learning_rate": 3.463403880070547e-05,
583
+ "loss": 11.669910888671875,
584
+ "step": 950
585
+ },
586
+ {
587
+ "epoch": 11.607142857142858,
588
+ "grad_norm": 32.78938293457031,
589
+ "learning_rate": 3.408289241622575e-05,
590
+ "loss": 11.80724853515625,
591
+ "step": 975
592
+ },
593
+ {
594
+ "epoch": 11.904761904761905,
595
+ "grad_norm": 14.23360824584961,
596
+ "learning_rate": 3.353174603174603e-05,
597
+ "loss": 11.633603515625,
598
+ "step": 1000
599
+ },
600
+ {
601
+ "epoch": 12.0,
602
+ "eval_loss": 7.61862325668335,
603
+ "eval_map": 0.1452,
604
+ "eval_map_50": 0.2085,
605
+ "eval_map_75": 0.1433,
606
+ "eval_map_group": 0.0673,
607
+ "eval_map_image": 0.2435,
608
+ "eval_map_large": 0.2939,
609
+ "eval_map_medium": 0.2001,
610
+ "eval_map_rectangle": 0.1766,
611
+ "eval_map_small": 0.0697,
612
+ "eval_map_text": 0.0935,
613
+ "eval_mar_1": 0.0465,
614
+ "eval_mar_10": 0.2467,
615
+ "eval_mar_100": 0.4811,
616
+ "eval_mar_100_group": 0.5087,
617
+ "eval_mar_100_image": 0.6105,
618
+ "eval_mar_100_rectangle": 0.4571,
619
+ "eval_mar_100_text": 0.3481,
620
+ "eval_mar_large": 0.7906,
621
+ "eval_mar_medium": 0.5665,
622
+ "eval_mar_small": 0.273,
623
+ "eval_runtime": 17.2166,
624
+ "eval_samples_per_second": 6.97,
625
+ "eval_steps_per_second": 0.871,
626
+ "step": 1008
627
+ },
628
+ {
629
+ "epoch": 12.202380952380953,
630
+ "grad_norm": 56.82817840576172,
631
+ "learning_rate": 3.2980599647266316e-05,
632
+ "loss": 11.56818603515625,
633
+ "step": 1025
634
+ },
635
+ {
636
+ "epoch": 12.5,
637
+ "grad_norm": 21.191076278686523,
638
+ "learning_rate": 3.2429453262786595e-05,
639
+ "loss": 11.379783935546875,
640
+ "step": 1050
641
+ },
642
+ {
643
+ "epoch": 12.797619047619047,
644
+ "grad_norm": 48.60485076904297,
645
+ "learning_rate": 3.187830687830688e-05,
646
+ "loss": 11.505103759765625,
647
+ "step": 1075
648
+ },
649
+ {
650
+ "epoch": 13.0,
651
+ "eval_loss": 7.647872447967529,
652
+ "eval_map": 0.1367,
653
+ "eval_map_50": 0.1944,
654
+ "eval_map_75": 0.1348,
655
+ "eval_map_group": 0.0665,
656
+ "eval_map_image": 0.2308,
657
+ "eval_map_large": 0.2837,
658
+ "eval_map_medium": 0.201,
659
+ "eval_map_rectangle": 0.1654,
660
+ "eval_map_small": 0.0661,
661
+ "eval_map_text": 0.0839,
662
+ "eval_mar_1": 0.0456,
663
+ "eval_mar_10": 0.2329,
664
+ "eval_mar_100": 0.4692,
665
+ "eval_mar_100_group": 0.5001,
666
+ "eval_mar_100_image": 0.5892,
667
+ "eval_mar_100_rectangle": 0.4515,
668
+ "eval_mar_100_text": 0.3359,
669
+ "eval_mar_large": 0.7908,
670
+ "eval_mar_medium": 0.5583,
671
+ "eval_mar_small": 0.2496,
672
+ "eval_runtime": 17.2376,
673
+ "eval_samples_per_second": 6.962,
674
+ "eval_steps_per_second": 0.87,
675
+ "step": 1092
676
+ },
677
+ {
678
+ "epoch": 13.095238095238095,
679
+ "grad_norm": 33.55184555053711,
680
+ "learning_rate": 3.1327160493827165e-05,
681
+ "loss": 11.693345947265625,
682
+ "step": 1100
683
+ },
684
+ {
685
+ "epoch": 13.392857142857142,
686
+ "grad_norm": 10.436372756958008,
687
+ "learning_rate": 3.0776014109347444e-05,
688
+ "loss": 11.6796435546875,
689
+ "step": 1125
690
+ },
691
+ {
692
+ "epoch": 13.69047619047619,
693
+ "grad_norm": 18.514883041381836,
694
+ "learning_rate": 3.022486772486773e-05,
695
+ "loss": 11.21151611328125,
696
+ "step": 1150
697
+ },
698
+ {
699
+ "epoch": 13.988095238095237,
700
+ "grad_norm": 10.212114334106445,
701
+ "learning_rate": 2.967372134038801e-05,
702
+ "loss": 11.76965576171875,
703
+ "step": 1175
704
+ },
705
+ {
706
+ "epoch": 14.0,
707
+ "eval_loss": 7.631312370300293,
708
+ "eval_map": 0.1524,
709
+ "eval_map_50": 0.2192,
710
+ "eval_map_75": 0.15,
711
+ "eval_map_group": 0.0797,
712
+ "eval_map_image": 0.2496,
713
+ "eval_map_large": 0.2967,
714
+ "eval_map_medium": 0.213,
715
+ "eval_map_rectangle": 0.1743,
716
+ "eval_map_small": 0.0767,
717
+ "eval_map_text": 0.1059,
718
+ "eval_mar_1": 0.0481,
719
+ "eval_mar_10": 0.2508,
720
+ "eval_mar_100": 0.4937,
721
+ "eval_mar_100_group": 0.5226,
722
+ "eval_mar_100_image": 0.6179,
723
+ "eval_mar_100_rectangle": 0.4513,
724
+ "eval_mar_100_text": 0.383,
725
+ "eval_mar_large": 0.7914,
726
+ "eval_mar_medium": 0.578,
727
+ "eval_mar_small": 0.2893,
728
+ "eval_runtime": 17.3512,
729
+ "eval_samples_per_second": 6.916,
730
+ "eval_steps_per_second": 0.864,
731
+ "step": 1176
732
+ },
733
+ {
734
+ "epoch": 14.285714285714286,
735
+ "grad_norm": 35.04265213012695,
736
+ "learning_rate": 2.912257495590829e-05,
737
+ "loss": 11.576104736328125,
738
+ "step": 1200
739
+ },
740
+ {
741
+ "epoch": 14.583333333333334,
742
+ "grad_norm": 32.3892822265625,
743
+ "learning_rate": 2.857142857142857e-05,
744
+ "loss": 11.311810302734376,
745
+ "step": 1225
746
+ },
747
+ {
748
+ "epoch": 14.880952380952381,
749
+ "grad_norm": 44.537376403808594,
750
+ "learning_rate": 2.8020282186948853e-05,
751
+ "loss": 11.286588134765625,
752
+ "step": 1250
753
+ },
754
+ {
755
+ "epoch": 15.0,
756
+ "eval_loss": 7.60584020614624,
757
+ "eval_map": 0.1544,
758
+ "eval_map_50": 0.2216,
759
+ "eval_map_75": 0.1513,
760
+ "eval_map_group": 0.0822,
761
+ "eval_map_image": 0.249,
762
+ "eval_map_large": 0.3055,
763
+ "eval_map_medium": 0.2181,
764
+ "eval_map_rectangle": 0.1776,
765
+ "eval_map_small": 0.0816,
766
+ "eval_map_text": 0.1087,
767
+ "eval_mar_1": 0.0505,
768
+ "eval_mar_10": 0.2549,
769
+ "eval_mar_100": 0.4948,
770
+ "eval_mar_100_group": 0.5213,
771
+ "eval_mar_100_image": 0.6152,
772
+ "eval_mar_100_rectangle": 0.4614,
773
+ "eval_mar_100_text": 0.3812,
774
+ "eval_mar_large": 0.7931,
775
+ "eval_mar_medium": 0.5825,
776
+ "eval_mar_small": 0.2855,
777
+ "eval_runtime": 17.0444,
778
+ "eval_samples_per_second": 7.04,
779
+ "eval_steps_per_second": 0.88,
780
+ "step": 1260
781
+ },
782
+ {
783
+ "epoch": 15.178571428571429,
784
+ "grad_norm": 10.380435943603516,
785
+ "learning_rate": 2.7469135802469138e-05,
786
+ "loss": 11.5576953125,
787
+ "step": 1275
788
+ },
789
+ {
790
+ "epoch": 15.476190476190476,
791
+ "grad_norm": 12.200742721557617,
792
+ "learning_rate": 2.691798941798942e-05,
793
+ "loss": 11.44038818359375,
794
+ "step": 1300
795
+ },
796
+ {
797
+ "epoch": 15.773809523809524,
798
+ "grad_norm": 9.843217849731445,
799
+ "learning_rate": 2.63668430335097e-05,
800
+ "loss": 10.94272216796875,
801
+ "step": 1325
802
+ },
803
+ {
804
+ "epoch": 16.0,
805
+ "eval_loss": 7.568243980407715,
806
+ "eval_map": 0.1551,
807
+ "eval_map_50": 0.2188,
808
+ "eval_map_75": 0.1537,
809
+ "eval_map_group": 0.0866,
810
+ "eval_map_image": 0.2522,
811
+ "eval_map_large": 0.3189,
812
+ "eval_map_medium": 0.2193,
813
+ "eval_map_rectangle": 0.1842,
814
+ "eval_map_small": 0.0744,
815
+ "eval_map_text": 0.0972,
816
+ "eval_mar_1": 0.0513,
817
+ "eval_mar_10": 0.2521,
818
+ "eval_mar_100": 0.4899,
819
+ "eval_mar_100_group": 0.5293,
820
+ "eval_mar_100_image": 0.613,
821
+ "eval_mar_100_rectangle": 0.462,
822
+ "eval_mar_100_text": 0.3554,
823
+ "eval_mar_large": 0.8016,
824
+ "eval_mar_medium": 0.5813,
825
+ "eval_mar_small": 0.2772,
826
+ "eval_runtime": 17.2934,
827
+ "eval_samples_per_second": 6.939,
828
+ "eval_steps_per_second": 0.867,
829
+ "step": 1344
830
+ },
831
+ {
832
+ "epoch": 16.071428571428573,
833
+ "grad_norm": 11.41603946685791,
834
+ "learning_rate": 2.5815696649029987e-05,
835
+ "loss": 11.799744873046874,
836
+ "step": 1350
837
+ },
838
+ {
839
+ "epoch": 16.36904761904762,
840
+ "grad_norm": 10.90324878692627,
841
+ "learning_rate": 2.526455026455027e-05,
842
+ "loss": 11.40052978515625,
843
+ "step": 1375
844
+ },
845
+ {
846
+ "epoch": 16.666666666666668,
847
+ "grad_norm": 19.619916915893555,
848
+ "learning_rate": 2.471340388007055e-05,
849
+ "loss": 11.129947509765625,
850
+ "step": 1400
851
+ },
852
+ {
853
+ "epoch": 16.964285714285715,
854
+ "grad_norm": 20.032556533813477,
855
+ "learning_rate": 2.416225749559083e-05,
856
+ "loss": 11.209949951171875,
857
+ "step": 1425
858
+ },
859
+ {
860
+ "epoch": 17.0,
861
+ "eval_loss": 7.599889755249023,
862
+ "eval_map": 0.1529,
863
+ "eval_map_50": 0.2152,
864
+ "eval_map_75": 0.1518,
865
+ "eval_map_group": 0.0918,
866
+ "eval_map_image": 0.2452,
867
+ "eval_map_large": 0.3052,
868
+ "eval_map_medium": 0.2287,
869
+ "eval_map_rectangle": 0.1826,
870
+ "eval_map_small": 0.0755,
871
+ "eval_map_text": 0.0918,
872
+ "eval_mar_1": 0.0481,
873
+ "eval_mar_10": 0.2552,
874
+ "eval_mar_100": 0.4926,
875
+ "eval_mar_100_group": 0.5311,
876
+ "eval_mar_100_image": 0.6157,
877
+ "eval_mar_100_rectangle": 0.4654,
878
+ "eval_mar_100_text": 0.3585,
879
+ "eval_mar_large": 0.8057,
880
+ "eval_mar_medium": 0.5831,
881
+ "eval_mar_small": 0.2802,
882
+ "eval_runtime": 17.1006,
883
+ "eval_samples_per_second": 7.017,
884
+ "eval_steps_per_second": 0.877,
885
+ "step": 1428
886
+ },
887
+ {
888
+ "epoch": 17.261904761904763,
889
+ "grad_norm": 17.242233276367188,
890
+ "learning_rate": 2.361111111111111e-05,
891
+ "loss": 11.399385986328125,
892
+ "step": 1450
893
+ },
894
+ {
895
+ "epoch": 17.55952380952381,
896
+ "grad_norm": 13.795672416687012,
897
+ "learning_rate": 2.3059964726631396e-05,
898
+ "loss": 11.417935791015625,
899
+ "step": 1475
900
+ },
901
+ {
902
+ "epoch": 17.857142857142858,
903
+ "grad_norm": 11.631192207336426,
904
+ "learning_rate": 2.2508818342151678e-05,
905
+ "loss": 10.97098876953125,
906
+ "step": 1500
907
+ },
908
+ {
909
+ "epoch": 18.0,
910
+ "eval_loss": 7.5713324546813965,
911
+ "eval_map": 0.1577,
912
+ "eval_map_50": 0.2227,
913
+ "eval_map_75": 0.157,
914
+ "eval_map_group": 0.0951,
915
+ "eval_map_image": 0.2512,
916
+ "eval_map_large": 0.3131,
917
+ "eval_map_medium": 0.229,
918
+ "eval_map_rectangle": 0.1884,
919
+ "eval_map_small": 0.0815,
920
+ "eval_map_text": 0.0962,
921
+ "eval_mar_1": 0.0494,
922
+ "eval_mar_10": 0.2586,
923
+ "eval_mar_100": 0.4979,
924
+ "eval_mar_100_group": 0.5349,
925
+ "eval_mar_100_image": 0.6257,
926
+ "eval_mar_100_rectangle": 0.4593,
927
+ "eval_mar_100_text": 0.3716,
928
+ "eval_mar_large": 0.7908,
929
+ "eval_mar_medium": 0.5872,
930
+ "eval_mar_small": 0.292,
931
+ "eval_runtime": 17.1925,
932
+ "eval_samples_per_second": 6.98,
933
+ "eval_steps_per_second": 0.872,
934
+ "step": 1512
935
+ },
936
+ {
937
+ "epoch": 18.154761904761905,
938
+ "grad_norm": 15.366872787475586,
939
+ "learning_rate": 2.1957671957671956e-05,
940
+ "loss": 11.15154541015625,
941
+ "step": 1525
942
+ },
943
+ {
944
+ "epoch": 18.452380952380953,
945
+ "grad_norm": 13.13204574584961,
946
+ "learning_rate": 2.140652557319224e-05,
947
+ "loss": 11.403101806640626,
948
+ "step": 1550
949
+ },
950
+ {
951
+ "epoch": 18.75,
952
+ "grad_norm": 16.772144317626953,
953
+ "learning_rate": 2.0855379188712523e-05,
954
+ "loss": 11.07358642578125,
955
+ "step": 1575
956
+ },
957
+ {
958
+ "epoch": 19.0,
959
+ "eval_loss": 7.5920186042785645,
960
+ "eval_map": 0.1568,
961
+ "eval_map_50": 0.2195,
962
+ "eval_map_75": 0.1546,
963
+ "eval_map_group": 0.0976,
964
+ "eval_map_image": 0.2611,
965
+ "eval_map_large": 0.3225,
966
+ "eval_map_medium": 0.224,
967
+ "eval_map_rectangle": 0.1799,
968
+ "eval_map_small": 0.0759,
969
+ "eval_map_text": 0.0887,
970
+ "eval_mar_1": 0.0493,
971
+ "eval_mar_10": 0.2589,
972
+ "eval_mar_100": 0.4901,
973
+ "eval_mar_100_group": 0.5376,
974
+ "eval_mar_100_image": 0.626,
975
+ "eval_mar_100_rectangle": 0.454,
976
+ "eval_mar_100_text": 0.3428,
977
+ "eval_mar_large": 0.7912,
978
+ "eval_mar_medium": 0.584,
979
+ "eval_mar_small": 0.2779,
980
+ "eval_runtime": 16.8456,
981
+ "eval_samples_per_second": 7.124,
982
+ "eval_steps_per_second": 0.89,
983
+ "step": 1596
984
+ },
985
+ {
986
+ "epoch": 19.047619047619047,
987
+ "grad_norm": 72.46932220458984,
988
+ "learning_rate": 2.0304232804232805e-05,
989
+ "loss": 11.312447509765626,
990
+ "step": 1600
991
+ },
992
+ {
993
+ "epoch": 19.345238095238095,
994
+ "grad_norm": 7.8378801345825195,
995
+ "learning_rate": 1.9753086419753087e-05,
996
+ "loss": 11.34157470703125,
997
+ "step": 1625
998
+ },
999
+ {
1000
+ "epoch": 19.642857142857142,
1001
+ "grad_norm": 14.729228973388672,
1002
+ "learning_rate": 1.920194003527337e-05,
1003
+ "loss": 11.0249072265625,
1004
+ "step": 1650
1005
+ },
1006
+ {
1007
+ "epoch": 19.94047619047619,
1008
+ "grad_norm": 25.199474334716797,
1009
+ "learning_rate": 1.8650793650793654e-05,
1010
+ "loss": 11.217237548828125,
1011
+ "step": 1675
1012
+ },
1013
+ {
1014
+ "epoch": 20.0,
1015
+ "eval_loss": 7.561267375946045,
1016
+ "eval_map": 0.153,
1017
+ "eval_map_50": 0.2144,
1018
+ "eval_map_75": 0.1502,
1019
+ "eval_map_group": 0.0971,
1020
+ "eval_map_image": 0.2449,
1021
+ "eval_map_large": 0.3227,
1022
+ "eval_map_medium": 0.2256,
1023
+ "eval_map_rectangle": 0.1846,
1024
+ "eval_map_small": 0.0726,
1025
+ "eval_map_text": 0.0851,
1026
+ "eval_mar_1": 0.0499,
1027
+ "eval_mar_10": 0.2533,
1028
+ "eval_mar_100": 0.4867,
1029
+ "eval_mar_100_group": 0.5363,
1030
+ "eval_mar_100_image": 0.6226,
1031
+ "eval_mar_100_rectangle": 0.4526,
1032
+ "eval_mar_100_text": 0.3353,
1033
+ "eval_mar_large": 0.8013,
1034
+ "eval_mar_medium": 0.5825,
1035
+ "eval_mar_small": 0.2765,
1036
+ "eval_runtime": 17.0648,
1037
+ "eval_samples_per_second": 7.032,
1038
+ "eval_steps_per_second": 0.879,
1039
+ "step": 1680
1040
+ },
1041
+ {
1042
+ "epoch": 20.238095238095237,
1043
+ "grad_norm": 21.974050521850586,
1044
+ "learning_rate": 1.8099647266313935e-05,
1045
+ "loss": 10.83720458984375,
1046
+ "step": 1700
1047
+ },
1048
+ {
1049
+ "epoch": 20.535714285714285,
1050
+ "grad_norm": 23.206058502197266,
1051
+ "learning_rate": 1.7548500881834214e-05,
1052
+ "loss": 11.15845458984375,
1053
+ "step": 1725
1054
+ },
1055
+ {
1056
+ "epoch": 20.833333333333332,
1057
+ "grad_norm": 29.534772872924805,
1058
+ "learning_rate": 1.69973544973545e-05,
1059
+ "loss": 11.038966064453126,
1060
+ "step": 1750
1061
+ },
1062
+ {
1063
+ "epoch": 21.0,
1064
+ "eval_loss": 7.541738986968994,
1065
+ "eval_map": 0.1597,
1066
+ "eval_map_50": 0.2248,
1067
+ "eval_map_75": 0.1578,
1068
+ "eval_map_group": 0.106,
1069
+ "eval_map_image": 0.2534,
1070
+ "eval_map_large": 0.3218,
1071
+ "eval_map_medium": 0.2289,
1072
+ "eval_map_rectangle": 0.1851,
1073
+ "eval_map_small": 0.0824,
1074
+ "eval_map_text": 0.0945,
1075
+ "eval_mar_1": 0.0504,
1076
+ "eval_mar_10": 0.262,
1077
+ "eval_mar_100": 0.4959,
1078
+ "eval_mar_100_group": 0.5397,
1079
+ "eval_mar_100_image": 0.6128,
1080
+ "eval_mar_100_rectangle": 0.4607,
1081
+ "eval_mar_100_text": 0.3705,
1082
+ "eval_mar_large": 0.7954,
1083
+ "eval_mar_medium": 0.5832,
1084
+ "eval_mar_small": 0.2921,
1085
+ "eval_runtime": 17.3182,
1086
+ "eval_samples_per_second": 6.929,
1087
+ "eval_steps_per_second": 0.866,
1088
+ "step": 1764
1089
+ },
1090
+ {
1091
+ "epoch": 21.13095238095238,
1092
+ "grad_norm": 12.260412216186523,
1093
+ "learning_rate": 1.644620811287478e-05,
1094
+ "loss": 11.237501220703125,
1095
+ "step": 1775
1096
+ },
1097
+ {
1098
+ "epoch": 21.428571428571427,
1099
+ "grad_norm": 8.769057273864746,
1100
+ "learning_rate": 1.5895061728395063e-05,
1101
+ "loss": 11.0806005859375,
1102
+ "step": 1800
1103
+ },
1104
+ {
1105
+ "epoch": 21.726190476190474,
1106
+ "grad_norm": 22.044124603271484,
1107
+ "learning_rate": 1.5343915343915344e-05,
1108
+ "loss": 11.148917236328124,
1109
+ "step": 1825
1110
+ },
1111
+ {
1112
+ "epoch": 22.0,
1113
+ "eval_loss": 7.538026332855225,
1114
+ "eval_map": 0.1599,
1115
+ "eval_map_50": 0.224,
1116
+ "eval_map_75": 0.1569,
1117
+ "eval_map_group": 0.1082,
1118
+ "eval_map_image": 0.2527,
1119
+ "eval_map_large": 0.3306,
1120
+ "eval_map_medium": 0.2308,
1121
+ "eval_map_rectangle": 0.1882,
1122
+ "eval_map_small": 0.0783,
1123
+ "eval_map_text": 0.0906,
1124
+ "eval_mar_1": 0.0488,
1125
+ "eval_mar_10": 0.2596,
1126
+ "eval_mar_100": 0.4935,
1127
+ "eval_mar_100_group": 0.5411,
1128
+ "eval_mar_100_image": 0.6195,
1129
+ "eval_mar_100_rectangle": 0.4587,
1130
+ "eval_mar_100_text": 0.3547,
1131
+ "eval_mar_large": 0.7987,
1132
+ "eval_mar_medium": 0.5876,
1133
+ "eval_mar_small": 0.2839,
1134
+ "eval_runtime": 17.1176,
1135
+ "eval_samples_per_second": 7.01,
1136
+ "eval_steps_per_second": 0.876,
1137
+ "step": 1848
1138
+ },
1139
+ {
1140
+ "epoch": 22.023809523809526,
1141
+ "grad_norm": 10.205994606018066,
1142
+ "learning_rate": 1.4792768959435626e-05,
1143
+ "loss": 11.559412841796876,
1144
+ "step": 1850
1145
+ },
1146
+ {
1147
+ "epoch": 22.321428571428573,
1148
+ "grad_norm": 7.906266212463379,
1149
+ "learning_rate": 1.424162257495591e-05,
1150
+ "loss": 11.12822998046875,
1151
+ "step": 1875
1152
+ },
1153
+ {
1154
+ "epoch": 22.61904761904762,
1155
+ "grad_norm": 10.976849555969238,
1156
+ "learning_rate": 1.3690476190476192e-05,
1157
+ "loss": 10.973646240234375,
1158
+ "step": 1900
1159
+ },
1160
+ {
1161
+ "epoch": 22.916666666666668,
1162
+ "grad_norm": 17.911376953125,
1163
+ "learning_rate": 1.3139329805996472e-05,
1164
+ "loss": 10.757685546875,
1165
+ "step": 1925
1166
+ },
1167
+ {
1168
+ "epoch": 23.0,
1169
+ "eval_loss": 7.559340000152588,
1170
+ "eval_map": 0.166,
1171
+ "eval_map_50": 0.2341,
1172
+ "eval_map_75": 0.1648,
1173
+ "eval_map_group": 0.1148,
1174
+ "eval_map_image": 0.2532,
1175
+ "eval_map_large": 0.338,
1176
+ "eval_map_medium": 0.2406,
1177
+ "eval_map_rectangle": 0.1871,
1178
+ "eval_map_small": 0.0849,
1179
+ "eval_map_text": 0.1089,
1180
+ "eval_mar_1": 0.0511,
1181
+ "eval_mar_10": 0.2643,
1182
+ "eval_mar_100": 0.4993,
1183
+ "eval_mar_100_group": 0.5457,
1184
+ "eval_mar_100_image": 0.6141,
1185
+ "eval_mar_100_rectangle": 0.459,
1186
+ "eval_mar_100_text": 0.3786,
1187
+ "eval_mar_large": 0.797,
1188
+ "eval_mar_medium": 0.5937,
1189
+ "eval_mar_small": 0.2892,
1190
+ "eval_runtime": 17.1914,
1191
+ "eval_samples_per_second": 6.98,
1192
+ "eval_steps_per_second": 0.873,
1193
+ "step": 1932
1194
+ },
1195
+ {
1196
+ "epoch": 23.214285714285715,
1197
+ "grad_norm": 14.862859725952148,
1198
+ "learning_rate": 1.2588183421516755e-05,
1199
+ "loss": 11.2927880859375,
1200
+ "step": 1950
1201
+ },
1202
+ {
1203
+ "epoch": 23.511904761904763,
1204
+ "grad_norm": 25.316974639892578,
1205
+ "learning_rate": 1.2037037037037037e-05,
1206
+ "loss": 10.83892822265625,
1207
+ "step": 1975
1208
+ },
1209
+ {
1210
+ "epoch": 23.80952380952381,
1211
+ "grad_norm": 12.938018798828125,
1212
+ "learning_rate": 1.148589065255732e-05,
1213
+ "loss": 10.78179443359375,
1214
+ "step": 2000
1215
+ },
1216
+ {
1217
+ "epoch": 24.0,
1218
+ "eval_loss": 7.54477071762085,
1219
+ "eval_map": 0.1581,
1220
+ "eval_map_50": 0.2225,
1221
+ "eval_map_75": 0.1557,
1222
+ "eval_map_group": 0.1103,
1223
+ "eval_map_image": 0.2517,
1224
+ "eval_map_large": 0.3262,
1225
+ "eval_map_medium": 0.2326,
1226
+ "eval_map_rectangle": 0.1766,
1227
+ "eval_map_small": 0.0781,
1228
+ "eval_map_text": 0.0938,
1229
+ "eval_mar_1": 0.0503,
1230
+ "eval_mar_10": 0.2565,
1231
+ "eval_mar_100": 0.487,
1232
+ "eval_mar_100_group": 0.5407,
1233
+ "eval_mar_100_image": 0.6067,
1234
+ "eval_mar_100_rectangle": 0.4519,
1235
+ "eval_mar_100_text": 0.3487,
1236
+ "eval_mar_large": 0.7977,
1237
+ "eval_mar_medium": 0.5912,
1238
+ "eval_mar_small": 0.2677,
1239
+ "eval_runtime": 17.1291,
1240
+ "eval_samples_per_second": 7.006,
1241
+ "eval_steps_per_second": 0.876,
1242
+ "step": 2016
1243
+ },
1244
+ {
1245
+ "epoch": 24.107142857142858,
1246
+ "grad_norm": 43.82697296142578,
1247
+ "learning_rate": 1.09347442680776e-05,
1248
+ "loss": 11.097623291015625,
1249
+ "step": 2025
1250
+ },
1251
+ {
1252
+ "epoch": 24.404761904761905,
1253
+ "grad_norm": 11.796220779418945,
1254
+ "learning_rate": 1.0383597883597884e-05,
1255
+ "loss": 11.050999755859374,
1256
+ "step": 2050
1257
+ },
1258
+ {
1259
+ "epoch": 24.702380952380953,
1260
+ "grad_norm": 11.335160255432129,
1261
+ "learning_rate": 9.832451499118166e-06,
1262
+ "loss": 10.86746337890625,
1263
+ "step": 2075
1264
+ },
1265
+ {
1266
+ "epoch": 25.0,
1267
+ "grad_norm": 18.967390060424805,
1268
+ "learning_rate": 9.281305114638448e-06,
1269
+ "loss": 11.010140380859376,
1270
+ "step": 2100
1271
+ },
1272
+ {
1273
+ "epoch": 25.0,
1274
+ "eval_loss": 7.518592357635498,
1275
+ "eval_map": 0.157,
1276
+ "eval_map_50": 0.2216,
1277
+ "eval_map_75": 0.1558,
1278
+ "eval_map_group": 0.1064,
1279
+ "eval_map_image": 0.2477,
1280
+ "eval_map_large": 0.3241,
1281
+ "eval_map_medium": 0.2348,
1282
+ "eval_map_rectangle": 0.1756,
1283
+ "eval_map_small": 0.0802,
1284
+ "eval_map_text": 0.0982,
1285
+ "eval_mar_1": 0.0505,
1286
+ "eval_mar_10": 0.2569,
1287
+ "eval_mar_100": 0.491,
1288
+ "eval_mar_100_group": 0.5458,
1289
+ "eval_mar_100_image": 0.6013,
1290
+ "eval_mar_100_rectangle": 0.4526,
1291
+ "eval_mar_100_text": 0.3644,
1292
+ "eval_mar_large": 0.7955,
1293
+ "eval_mar_medium": 0.5906,
1294
+ "eval_mar_small": 0.2748,
1295
+ "eval_runtime": 17.0932,
1296
+ "eval_samples_per_second": 7.02,
1297
+ "eval_steps_per_second": 0.878,
1298
+ "step": 2100
1299
+ },
1300
+ {
1301
+ "epoch": 25.297619047619047,
1302
+ "grad_norm": 7.750904560089111,
1303
+ "learning_rate": 8.73015873015873e-06,
1304
+ "loss": 10.79929931640625,
1305
+ "step": 2125
1306
+ },
1307
+ {
1308
+ "epoch": 25.595238095238095,
1309
+ "grad_norm": 16.77004623413086,
1310
+ "learning_rate": 8.179012345679013e-06,
1311
+ "loss": 10.849818115234376,
1312
+ "step": 2150
1313
+ },
1314
+ {
1315
+ "epoch": 25.892857142857142,
1316
+ "grad_norm": 20.175363540649414,
1317
+ "learning_rate": 7.627865961199294e-06,
1318
+ "loss": 10.97046875,
1319
+ "step": 2175
1320
+ },
1321
+ {
1322
+ "epoch": 26.0,
1323
+ "eval_loss": 7.568551063537598,
1324
+ "eval_map": 0.1583,
1325
+ "eval_map_50": 0.223,
1326
+ "eval_map_75": 0.1563,
1327
+ "eval_map_group": 0.11,
1328
+ "eval_map_image": 0.2487,
1329
+ "eval_map_large": 0.3214,
1330
+ "eval_map_medium": 0.2397,
1331
+ "eval_map_rectangle": 0.1804,
1332
+ "eval_map_small": 0.0796,
1333
+ "eval_map_text": 0.0943,
1334
+ "eval_mar_1": 0.0487,
1335
+ "eval_mar_10": 0.2593,
1336
+ "eval_mar_100": 0.4941,
1337
+ "eval_mar_100_group": 0.5395,
1338
+ "eval_mar_100_image": 0.6193,
1339
+ "eval_mar_100_rectangle": 0.4503,
1340
+ "eval_mar_100_text": 0.3673,
1341
+ "eval_mar_large": 0.7885,
1342
+ "eval_mar_medium": 0.5822,
1343
+ "eval_mar_small": 0.2876,
1344
+ "eval_runtime": 17.4348,
1345
+ "eval_samples_per_second": 6.883,
1346
+ "eval_steps_per_second": 0.86,
1347
+ "step": 2184
1348
+ },
1349
+ {
1350
+ "epoch": 26.19047619047619,
1351
+ "grad_norm": 11.11269474029541,
1352
+ "learning_rate": 7.076719576719578e-06,
1353
+ "loss": 11.78640869140625,
1354
+ "step": 2200
1355
+ },
1356
+ {
1357
+ "epoch": 26.488095238095237,
1358
+ "grad_norm": 8.43252182006836,
1359
+ "learning_rate": 6.5255731922398585e-06,
1360
+ "loss": 10.9381396484375,
1361
+ "step": 2225
1362
+ },
1363
+ {
1364
+ "epoch": 26.785714285714285,
1365
+ "grad_norm": 36.22833251953125,
1366
+ "learning_rate": 5.974426807760141e-06,
1367
+ "loss": 10.875008544921876,
1368
+ "step": 2250
1369
+ },
1370
+ {
1371
+ "epoch": 27.0,
1372
+ "eval_loss": 7.555787086486816,
1373
+ "eval_map": 0.1569,
1374
+ "eval_map_50": 0.2185,
1375
+ "eval_map_75": 0.1555,
1376
+ "eval_map_group": 0.1083,
1377
+ "eval_map_image": 0.2464,
1378
+ "eval_map_large": 0.3315,
1379
+ "eval_map_medium": 0.2371,
1380
+ "eval_map_rectangle": 0.185,
1381
+ "eval_map_small": 0.0771,
1382
+ "eval_map_text": 0.0878,
1383
+ "eval_mar_1": 0.0503,
1384
+ "eval_mar_10": 0.2538,
1385
+ "eval_mar_100": 0.4833,
1386
+ "eval_mar_100_group": 0.5389,
1387
+ "eval_mar_100_image": 0.6003,
1388
+ "eval_mar_100_rectangle": 0.4565,
1389
+ "eval_mar_100_text": 0.3373,
1390
+ "eval_mar_large": 0.8099,
1391
+ "eval_mar_medium": 0.5862,
1392
+ "eval_mar_small": 0.2609,
1393
+ "eval_runtime": 17.0991,
1394
+ "eval_samples_per_second": 7.018,
1395
+ "eval_steps_per_second": 0.877,
1396
+ "step": 2268
1397
+ },
1398
+ {
1399
+ "epoch": 27.083333333333332,
1400
+ "grad_norm": 12.785017013549805,
1401
+ "learning_rate": 5.423280423280423e-06,
1402
+ "loss": 10.976126708984374,
1403
+ "step": 2275
1404
+ },
1405
+ {
1406
+ "epoch": 27.38095238095238,
1407
+ "grad_norm": 12.107715606689453,
1408
+ "learning_rate": 4.872134038800706e-06,
1409
+ "loss": 11.2352734375,
1410
+ "step": 2300
1411
+ },
1412
+ {
1413
+ "epoch": 27.678571428571427,
1414
+ "grad_norm": 9.639913558959961,
1415
+ "learning_rate": 4.3209876543209875e-06,
1416
+ "loss": 11.119185791015624,
1417
+ "step": 2325
1418
+ },
1419
+ {
1420
+ "epoch": 27.976190476190474,
1421
+ "grad_norm": 16.351314544677734,
1422
+ "learning_rate": 3.7698412698412697e-06,
1423
+ "loss": 10.751910400390624,
1424
+ "step": 2350
1425
+ },
1426
+ {
1427
+ "epoch": 28.0,
1428
+ "eval_loss": 7.529413223266602,
1429
+ "eval_map": 0.1604,
1430
+ "eval_map_50": 0.224,
1431
+ "eval_map_75": 0.1595,
1432
+ "eval_map_group": 0.1109,
1433
+ "eval_map_image": 0.2489,
1434
+ "eval_map_large": 0.3368,
1435
+ "eval_map_medium": 0.2361,
1436
+ "eval_map_rectangle": 0.185,
1437
+ "eval_map_small": 0.0825,
1438
+ "eval_map_text": 0.0968,
1439
+ "eval_mar_1": 0.0499,
1440
+ "eval_mar_10": 0.2565,
1441
+ "eval_mar_100": 0.4946,
1442
+ "eval_mar_100_group": 0.5448,
1443
+ "eval_mar_100_image": 0.6148,
1444
+ "eval_mar_100_rectangle": 0.4581,
1445
+ "eval_mar_100_text": 0.3608,
1446
+ "eval_mar_large": 0.7961,
1447
+ "eval_mar_medium": 0.5903,
1448
+ "eval_mar_small": 0.2794,
1449
+ "eval_runtime": 16.8513,
1450
+ "eval_samples_per_second": 7.121,
1451
+ "eval_steps_per_second": 0.89,
1452
+ "step": 2352
1453
+ },
1454
+ {
1455
+ "epoch": 28.273809523809526,
1456
+ "grad_norm": 12.011247634887695,
1457
+ "learning_rate": 3.218694885361552e-06,
1458
+ "loss": 10.890947265625,
1459
+ "step": 2375
1460
+ },
1461
+ {
1462
+ "epoch": 28.571428571428573,
1463
+ "grad_norm": 11.049712181091309,
1464
+ "learning_rate": 2.667548500881834e-06,
1465
+ "loss": 11.18763427734375,
1466
+ "step": 2400
1467
+ },
1468
+ {
1469
+ "epoch": 28.86904761904762,
1470
+ "grad_norm": 16.048168182373047,
1471
+ "learning_rate": 2.1164021164021164e-06,
1472
+ "loss": 10.83516845703125,
1473
+ "step": 2425
1474
+ },
1475
+ {
1476
+ "epoch": 29.0,
1477
+ "eval_loss": 7.537722587585449,
1478
+ "eval_map": 0.1657,
1479
+ "eval_map_50": 0.2311,
1480
+ "eval_map_75": 0.1638,
1481
+ "eval_map_group": 0.1191,
1482
+ "eval_map_image": 0.2592,
1483
+ "eval_map_large": 0.3459,
1484
+ "eval_map_medium": 0.2391,
1485
+ "eval_map_rectangle": 0.1949,
1486
+ "eval_map_small": 0.0816,
1487
+ "eval_map_text": 0.0897,
1488
+ "eval_mar_1": 0.0509,
1489
+ "eval_mar_10": 0.2653,
1490
+ "eval_mar_100": 0.4975,
1491
+ "eval_mar_100_group": 0.5462,
1492
+ "eval_mar_100_image": 0.6243,
1493
+ "eval_mar_100_rectangle": 0.4592,
1494
+ "eval_mar_100_text": 0.3604,
1495
+ "eval_mar_large": 0.8001,
1496
+ "eval_mar_medium": 0.59,
1497
+ "eval_mar_small": 0.2873,
1498
+ "eval_runtime": 17.2358,
1499
+ "eval_samples_per_second": 6.962,
1500
+ "eval_steps_per_second": 0.87,
1501
+ "step": 2436
1502
+ },
1503
+ {
1504
+ "epoch": 29.166666666666668,
1505
+ "grad_norm": 11.860162734985352,
1506
+ "learning_rate": 1.5652557319223987e-06,
1507
+ "loss": 11.17228515625,
1508
+ "step": 2450
1509
+ },
1510
+ {
1511
+ "epoch": 29.464285714285715,
1512
+ "grad_norm": 17.13775062561035,
1513
+ "learning_rate": 1.0141093474426807e-06,
1514
+ "loss": 11.1133935546875,
1515
+ "step": 2475
1516
+ },
1517
+ {
1518
+ "epoch": 29.761904761904763,
1519
+ "grad_norm": 15.238182067871094,
1520
+ "learning_rate": 4.6296296296296297e-07,
1521
+ "loss": 10.7695751953125,
1522
+ "step": 2500
1523
+ },
1524
+ {
1525
+ "epoch": 30.0,
1526
+ "eval_loss": 7.532639503479004,
1527
+ "eval_map": 0.1598,
1528
+ "eval_map_50": 0.2221,
1529
+ "eval_map_75": 0.1589,
1530
+ "eval_map_group": 0.1105,
1531
+ "eval_map_image": 0.2522,
1532
+ "eval_map_large": 0.3415,
1533
+ "eval_map_medium": 0.2358,
1534
+ "eval_map_rectangle": 0.1861,
1535
+ "eval_map_small": 0.0793,
1536
+ "eval_map_text": 0.0905,
1537
+ "eval_mar_1": 0.0499,
1538
+ "eval_mar_10": 0.2576,
1539
+ "eval_mar_100": 0.4897,
1540
+ "eval_mar_100_group": 0.5388,
1541
+ "eval_mar_100_image": 0.6149,
1542
+ "eval_mar_100_rectangle": 0.4594,
1543
+ "eval_mar_100_text": 0.3458,
1544
+ "eval_mar_large": 0.8065,
1545
+ "eval_mar_medium": 0.5899,
1546
+ "eval_mar_small": 0.2705,
1547
+ "eval_runtime": 16.9062,
1548
+ "eval_samples_per_second": 7.098,
1549
+ "eval_steps_per_second": 0.887,
1550
+ "step": 2520
1551
+ },
1552
+ {
1553
+ "epoch": 30.0,
1554
+ "step": 2520,
1555
+ "total_flos": 2.95288818499584e+18,
1556
+ "train_loss": 12.287477396404933,
1557
+ "train_runtime": 1674.3599,
1558
+ "train_samples_per_second": 11.915,
1559
+ "train_steps_per_second": 1.505
1560
+ }
1561
+ ],
1562
+ "logging_steps": 25,
1563
+ "max_steps": 2520,
1564
+ "num_input_tokens_seen": 0,
1565
+ "num_train_epochs": 30,
1566
+ "save_steps": 500,
1567
+ "stateful_callbacks": {
1568
+ "TrainerControl": {
1569
+ "args": {
1570
+ "should_epoch_stop": false,
1571
+ "should_evaluate": false,
1572
+ "should_log": false,
1573
+ "should_save": true,
1574
+ "should_training_stop": true
1575
+ },
1576
+ "attributes": {}
1577
+ }
1578
+ },
1579
+ "total_flos": 2.95288818499584e+18,
1580
+ "train_batch_size": 8,
1581
+ "trial_name": null,
1582
+ "trial_params": null
1583
+ }