vivek-dani committed on
Commit
94add1a
·
1 Parent(s): 81a4902

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -1,6 +1,5 @@
1
  {
2
- "_commit_hash": "a959cf33c20e09215873e338299c900f57047c61",
3
- "_name_or_path": "naver-clova-ix/donut-base",
4
  "architectures": [
5
  "VisionEncoderDecoderModel"
6
  ],
@@ -91,27 +90,26 @@
91
  },
92
  "decoder_start_token_id": 0,
93
  "encoder": {
94
- "_name_or_path": "",
95
  "add_cross_attention": false,
96
- "architectures": null,
 
 
97
  "attention_probs_dropout_prob": 0.0,
 
 
 
 
98
  "bad_words_ids": null,
99
  "begin_suppress_tokens": null,
100
  "bos_token_id": null,
101
  "chunk_size_feed_forward": 0,
102
  "cross_attention_hidden_size": null,
103
  "decoder_start_token_id": null,
104
- "depths": [
105
- 2,
106
- 2,
107
- 14,
108
- 2
109
- ],
110
  "diversity_penalty": 0.0,
111
  "do_sample": false,
112
  "drop_path_rate": 0.1,
113
  "early_stopping": false,
114
- "embed_dim": 128,
115
  "encoder_no_repeat_ngram_size": 0,
116
  "eos_token_id": null,
117
  "exponential_decay_length_penalty": null,
@@ -126,48 +124,55 @@
126
  "1": "LABEL_1"
127
  },
128
  "image_size": [
129
- 960,
130
- 720
131
  ],
132
  "initializer_range": 0.02,
 
133
  "is_decoder": false,
134
  "is_encoder_decoder": false,
135
  "label2id": {
136
  "LABEL_0": 0,
137
  "LABEL_1": 1
138
  },
139
- "layer_norm_eps": 1e-05,
 
140
  "length_penalty": 1.0,
141
  "max_length": 20,
142
  "min_length": 0,
143
- "mlp_ratio": 4.0,
144
- "model_type": "donut-swin",
145
  "no_repeat_ngram_size": 0,
 
146
  "num_beam_groups": 1,
147
  "num_beams": 1,
148
  "num_channels": 3,
149
- "num_heads": [
150
- 4,
151
- 8,
152
- 16,
153
- 32
154
- ],
155
- "num_layers": 4,
156
  "num_return_sequences": 1,
 
 
 
 
 
 
157
  "output_attentions": false,
158
  "output_hidden_states": false,
159
  "output_scores": false,
160
  "pad_token_id": null,
161
- "patch_size": 4,
162
- "path_norm": true,
 
 
 
 
 
163
  "prefix": null,
164
  "problem_type": null,
165
  "pruned_heads": {},
166
- "qkv_bias": true,
167
  "remove_invalid_values": false,
168
  "repetition_penalty": 1.0,
169
  "return_dict": true,
170
  "return_dict_in_generate": false,
 
171
  "sep_token_id": null,
172
  "suppress_tokens": null,
173
  "task_specific_params": null,
@@ -178,13 +183,18 @@
178
  "tokenizer_class": null,
179
  "top_k": 50,
180
  "top_p": 1.0,
181
- "torch_dtype": null,
182
  "torchscript": false,
183
  "transformers_version": "4.25.0.dev0",
184
  "typical_p": 1.0,
185
- "use_absolute_embeddings": false,
 
186
  "use_bfloat16": false,
187
- "window_size": 10
 
 
 
 
188
  },
189
  "is_encoder_decoder": true,
190
  "model_type": "vision-encoder-decoder",
 
1
  {
2
+ "_commit_hash": null,
 
3
  "architectures": [
4
  "VisionEncoderDecoderModel"
5
  ],
 
90
  },
91
  "decoder_start_token_id": 0,
92
  "encoder": {
93
+ "_name_or_path": "microsoft/dit-large",
94
  "add_cross_attention": false,
95
+ "architectures": [
96
+ "BeitForMaskedImageModeling"
97
+ ],
98
  "attention_probs_dropout_prob": 0.0,
99
+ "auxiliary_channels": 256,
100
+ "auxiliary_concat_input": false,
101
+ "auxiliary_loss_weight": 0.4,
102
+ "auxiliary_num_convs": 1,
103
  "bad_words_ids": null,
104
  "begin_suppress_tokens": null,
105
  "bos_token_id": null,
106
  "chunk_size_feed_forward": 0,
107
  "cross_attention_hidden_size": null,
108
  "decoder_start_token_id": null,
 
 
 
 
 
 
109
  "diversity_penalty": 0.0,
110
  "do_sample": false,
111
  "drop_path_rate": 0.1,
112
  "early_stopping": false,
 
113
  "encoder_no_repeat_ngram_size": 0,
114
  "eos_token_id": null,
115
  "exponential_decay_length_penalty": null,
 
124
  "1": "LABEL_1"
125
  },
126
  "image_size": [
127
+ 224,
128
+ 224
129
  ],
130
  "initializer_range": 0.02,
131
+ "intermediate_size": 4096,
132
  "is_decoder": false,
133
  "is_encoder_decoder": false,
134
  "label2id": {
135
  "LABEL_0": 0,
136
  "LABEL_1": 1
137
  },
138
+ "layer_norm_eps": 1e-12,
139
+ "layer_scale_init_value": 0.1,
140
  "length_penalty": 1.0,
141
  "max_length": 20,
142
  "min_length": 0,
143
+ "model_type": "beit",
 
144
  "no_repeat_ngram_size": 0,
145
+ "num_attention_heads": 16,
146
  "num_beam_groups": 1,
147
  "num_beams": 1,
148
  "num_channels": 3,
149
+ "num_hidden_layers": 24,
 
 
 
 
 
 
150
  "num_return_sequences": 1,
151
+ "out_indices": [
152
+ 3,
153
+ 5,
154
+ 7,
155
+ 11
156
+ ],
157
  "output_attentions": false,
158
  "output_hidden_states": false,
159
  "output_scores": false,
160
  "pad_token_id": null,
161
+ "patch_size": 16,
162
+ "pool_scales": [
163
+ 1,
164
+ 2,
165
+ 3,
166
+ 6
167
+ ],
168
  "prefix": null,
169
  "problem_type": null,
170
  "pruned_heads": {},
 
171
  "remove_invalid_values": false,
172
  "repetition_penalty": 1.0,
173
  "return_dict": true,
174
  "return_dict_in_generate": false,
175
+ "semantic_loss_ignore_index": 255,
176
  "sep_token_id": null,
177
  "suppress_tokens": null,
178
  "task_specific_params": null,
 
183
  "tokenizer_class": null,
184
  "top_k": 50,
185
  "top_p": 1.0,
186
+ "torch_dtype": "float32",
187
  "torchscript": false,
188
  "transformers_version": "4.25.0.dev0",
189
  "typical_p": 1.0,
190
+ "use_absolute_position_embeddings": true,
191
+ "use_auxiliary_head": true,
192
  "use_bfloat16": false,
193
+ "use_mask_token": true,
194
+ "use_mean_pooling": true,
195
+ "use_relative_position_bias": false,
196
+ "use_shared_relative_position_bias": false,
197
+ "vocab_size": 8192
198
  },
199
  "is_encoder_decoder": true,
200
  "model_type": "vision-encoder-decoder",
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a12ffd3f922819c10c8ccac60968c5c0f678297dfb55185ffe2c6ea589bc613
3
- size 809181691
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:719c994e0d5d21a92add2f2793cb4ac4188ca7b32910b27213d5f70997b78a85
3
+ size 1724178702
runs/Dec05_07-07-43_vidani1/1670224272.8914764/events.out.tfevents.1670224272.vidani1.13838.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64330d43196ac2d2ba10a7635fde4247128ea4909b4a0bd2473ff3d3a356f674
3
+ size 5702
runs/Dec05_07-07-43_vidani1/events.out.tfevents.1670224272.vidani1.13838.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:892dc7694bf97e72d406a70090dc14ad11f3d7711b31aa5b61c2f724051698a6
3
+ size 8480
runs/Dec05_07-16-06_vidani1/1670224578.67999/events.out.tfevents.1670224578.vidani1.2893.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79212da24a403472b0cd848129e205123cff73056db19ce45977ebca6c10ef7b
3
+ size 5702
runs/Dec05_07-16-06_vidani1/events.out.tfevents.1670224578.vidani1.2893.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38ea89999eb28c95738760d75dbc14d6aa41dc14054ffaa29ae2a83e9479af3f
3
+ size 8480
runs/Dec05_07-51-46_vidani1/1670226717.1223223/events.out.tfevents.1670226717.vidani1.13119.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:576950f5e52efa9dfe3e7ccdbd6faf5be0e7bcdc8523d52ad77023941912230a
3
+ size 5702
runs/Dec05_07-51-46_vidani1/events.out.tfevents.1670226717.vidani1.13119.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40b525cf77d43aebd6e5ae197f64cc4b8f9a6625163c857360d337b025fec678
3
+ size 8480
runs/Dec05_07-56-25_vidani1/1670226993.9422476/events.out.tfevents.1670226993.vidani1.13119.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:510268d95730db74eab6a4bf6efbe1063b52e6cbe277d128265de85a021c12a9
3
+ size 5702
runs/Dec05_07-56-25_vidani1/events.out.tfevents.1670226993.vidani1.13119.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c5207710d1995b0739abf30db4164a8061a1e852bff57a6f6df43d41568a0be
3
+ size 8480
runs/Dec05_08-00-03_vidani1/1670227214.9180048/events.out.tfevents.1670227214.vidani1.32400.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad88f7ff0b3e8fca24473770e7791e367154fcca078ef35c7c3ab715d679365a
3
+ size 5702
runs/Dec05_08-00-03_vidani1/events.out.tfevents.1670227214.vidani1.32400.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f12ba7cefc9a8991328973e728e51ac86696d2ddd35d53cae62e3b5c00de04ec
3
+ size 8479
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ef3a018de8ac98506192b15649328bdd91c9df6ddd83057cba7c61ff2f381ea
3
  size 3567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61f25a751b6e638a739a6c3292bc56fe0fb9c66b5974c11fe2ca9b72ef90f005
3
  size 3567