AlienKevin committed on
Commit
7311592
·
1 Parent(s): 618458e

Delete checkpoint-180

Browse files
checkpoint-180/config.json DELETED
@@ -1,180 +0,0 @@
1
- {
2
- "_commit_hash": "c8ec879716f6b8c2d782c3bd88686a5bec37102d",
3
- "_name_or_path": "microsoft/trocr-base-stage1",
4
- "architectures": [
5
- "VisionEncoderDecoderModel"
6
- ],
7
- "decoder": {
8
- "_name_or_path": "",
9
- "activation_dropout": 0.0,
10
- "activation_function": "relu",
11
- "add_cross_attention": true,
12
- "architectures": null,
13
- "attention_dropout": 0.0,
14
- "bad_words_ids": null,
15
- "begin_suppress_tokens": null,
16
- "bos_token_id": 0,
17
- "chunk_size_feed_forward": 0,
18
- "classifier_dropout": 0.0,
19
- "cross_attention_hidden_size": 768,
20
- "d_model": 1024,
21
- "decoder_attention_heads": 16,
22
- "decoder_ffn_dim": 4096,
23
- "decoder_layerdrop": 0.0,
24
- "decoder_layers": 12,
25
- "decoder_start_token_id": 2,
26
- "diversity_penalty": 0.0,
27
- "do_sample": false,
28
- "dropout": 0.1,
29
- "early_stopping": false,
30
- "encoder_no_repeat_ngram_size": 0,
31
- "eos_token_id": 2,
32
- "exponential_decay_length_penalty": null,
33
- "finetuning_task": null,
34
- "forced_bos_token_id": null,
35
- "forced_eos_token_id": null,
36
- "id2label": {
37
- "0": "LABEL_0",
38
- "1": "LABEL_1"
39
- },
40
- "init_std": 0.02,
41
- "is_decoder": true,
42
- "is_encoder_decoder": false,
43
- "label2id": {
44
- "LABEL_0": 0,
45
- "LABEL_1": 1
46
- },
47
- "layernorm_embedding": false,
48
- "length_penalty": 1.0,
49
- "max_length": 20,
50
- "max_position_embeddings": 1024,
51
- "min_length": 0,
52
- "model_type": "trocr",
53
- "no_repeat_ngram_size": 0,
54
- "num_beam_groups": 1,
55
- "num_beams": 1,
56
- "num_return_sequences": 1,
57
- "output_attentions": false,
58
- "output_hidden_states": false,
59
- "output_scores": false,
60
- "pad_token_id": 1,
61
- "prefix": null,
62
- "problem_type": null,
63
- "pruned_heads": {},
64
- "remove_invalid_values": false,
65
- "repetition_penalty": 1.0,
66
- "return_dict": true,
67
- "return_dict_in_generate": false,
68
- "scale_embedding": true,
69
- "sep_token_id": null,
70
- "suppress_tokens": null,
71
- "task_specific_params": null,
72
- "temperature": 1.0,
73
- "tf_legacy_loss": false,
74
- "tie_encoder_decoder": false,
75
- "tie_word_embeddings": false,
76
- "tokenizer_class": null,
77
- "top_k": 50,
78
- "top_p": 1.0,
79
- "torch_dtype": null,
80
- "torchscript": false,
81
- "transformers_version": "4.27.4",
82
- "typical_p": 1.0,
83
- "use_bfloat16": false,
84
- "use_cache": false,
85
- "use_learned_position_embeddings": false,
86
- "vocab_size": 50265
87
- },
88
- "decoder_start_token_id": 0,
89
- "early_stopping": true,
90
- "encoder": {
91
- "_name_or_path": "",
92
- "add_cross_attention": false,
93
- "architectures": null,
94
- "attention_probs_dropout_prob": 0.0,
95
- "bad_words_ids": null,
96
- "begin_suppress_tokens": null,
97
- "bos_token_id": null,
98
- "chunk_size_feed_forward": 0,
99
- "cross_attention_hidden_size": null,
100
- "decoder_start_token_id": null,
101
- "diversity_penalty": 0.0,
102
- "do_sample": false,
103
- "early_stopping": false,
104
- "encoder_no_repeat_ngram_size": 0,
105
- "encoder_stride": 16,
106
- "eos_token_id": null,
107
- "exponential_decay_length_penalty": null,
108
- "finetuning_task": null,
109
- "forced_bos_token_id": null,
110
- "forced_eos_token_id": null,
111
- "hidden_act": "gelu",
112
- "hidden_dropout_prob": 0.0,
113
- "hidden_size": 768,
114
- "id2label": {
115
- "0": "LABEL_0",
116
- "1": "LABEL_1"
117
- },
118
- "image_size": 384,
119
- "initializer_range": 0.02,
120
- "intermediate_size": 3072,
121
- "is_decoder": false,
122
- "is_encoder_decoder": false,
123
- "label2id": {
124
- "LABEL_0": 0,
125
- "LABEL_1": 1
126
- },
127
- "layer_norm_eps": 1e-12,
128
- "length_penalty": 1.0,
129
- "max_length": 20,
130
- "min_length": 0,
131
- "model_type": "vit",
132
- "no_repeat_ngram_size": 0,
133
- "num_attention_heads": 12,
134
- "num_beam_groups": 1,
135
- "num_beams": 1,
136
- "num_channels": 3,
137
- "num_hidden_layers": 12,
138
- "num_return_sequences": 1,
139
- "output_attentions": false,
140
- "output_hidden_states": false,
141
- "output_scores": false,
142
- "pad_token_id": null,
143
- "patch_size": 16,
144
- "prefix": null,
145
- "problem_type": null,
146
- "pruned_heads": {},
147
- "qkv_bias": false,
148
- "remove_invalid_values": false,
149
- "repetition_penalty": 1.0,
150
- "return_dict": true,
151
- "return_dict_in_generate": false,
152
- "sep_token_id": null,
153
- "suppress_tokens": null,
154
- "task_specific_params": null,
155
- "temperature": 1.0,
156
- "tf_legacy_loss": false,
157
- "tie_encoder_decoder": false,
158
- "tie_word_embeddings": true,
159
- "tokenizer_class": null,
160
- "top_k": 50,
161
- "top_p": 1.0,
162
- "torch_dtype": null,
163
- "torchscript": false,
164
- "transformers_version": "4.27.4",
165
- "typical_p": 1.0,
166
- "use_bfloat16": false
167
- },
168
- "eos_token_id": 2,
169
- "is_encoder_decoder": true,
170
- "length_penalty": 2.0,
171
- "max_length": 25,
172
- "model_type": "vision-encoder-decoder",
173
- "no_repeat_ngram_size": 3,
174
- "num_beams": 4,
175
- "pad_token_id": 1,
176
- "tie_word_embeddings": false,
177
- "torch_dtype": "float32",
178
- "transformers_version": null,
179
- "vocab_size": 50265
180
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-180/generation_config.json DELETED
@@ -1,13 +0,0 @@
1
- {
2
- "bos_token_id": 0,
3
- "decoder_start_token_id": 0,
4
- "early_stopping": true,
5
- "eos_token_id": 2,
6
- "length_penalty": 2.0,
7
- "max_length": 25,
8
- "no_repeat_ngram_size": 3,
9
- "num_beams": 4,
10
- "pad_token_id": 1,
11
- "transformers_version": "4.27.4",
12
- "use_cache": false
13
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-180/optimizer.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:0dc419dab2072c86ba7db4c4e8bfffe1adfae4efd6893041ec1d22f39e831ce0
3
- size 3074459717
 
 
 
 
checkpoint-180/preprocessor_config.json DELETED
@@ -1,22 +0,0 @@
1
- {
2
- "do_normalize": true,
3
- "do_rescale": true,
4
- "do_resize": true,
5
- "image_mean": [
6
- 0.5,
7
- 0.5,
8
- 0.5
9
- ],
10
- "image_processor_type": "ViTImageProcessor",
11
- "image_std": [
12
- 0.5,
13
- 0.5,
14
- 0.5
15
- ],
16
- "resample": 2,
17
- "rescale_factor": 0.00392156862745098,
18
- "size": {
19
- "height": 384,
20
- "width": 384
21
- }
22
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-180/pytorch_model.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:76ad2f81fe629f870a1d44be06b058c4fb284eda95ab6d79c090e77135c97c68
3
- size 1539618953
 
 
 
 
checkpoint-180/rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:f91f5d4545cc6b436bf40d8b2200ffd99059ad78783ce772d08997ced40541b7
3
- size 13553
 
 
 
 
checkpoint-180/scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:93370859a32524141e70ecd87308ad7517dad70e01d91f181fb43bdf428001ca
3
- size 627
 
 
 
 
checkpoint-180/trainer_state.json DELETED
@@ -1,178 +0,0 @@
1
- {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 2.8125,
5
- "global_step": 180,
6
- "is_hyper_param_search": false,
7
- "is_local_process_zero": true,
8
- "is_world_process_zero": true,
9
- "log_history": [
10
- {
11
- "epoch": 0.16,
12
- "learning_rate": 4.739583333333333e-05,
13
- "loss": 0.2329,
14
- "step": 10
15
- },
16
- {
17
- "epoch": 0.31,
18
- "learning_rate": 4.4791666666666673e-05,
19
- "loss": 0.0657,
20
- "step": 20
21
- },
22
- {
23
- "epoch": 0.47,
24
- "learning_rate": 4.21875e-05,
25
- "loss": 0.0442,
26
- "step": 30
27
- },
28
- {
29
- "epoch": 0.47,
30
- "eval_cer": 0.09341614906832298,
31
- "eval_loss": 0.03504600375890732,
32
- "eval_runtime": 433.0095,
33
- "eval_samples_per_second": 1.18,
34
- "eval_steps_per_second": 0.037,
35
- "step": 30
36
- },
37
- {
38
- "epoch": 0.62,
39
- "learning_rate": 3.958333333333333e-05,
40
- "loss": 0.0327,
41
- "step": 40
42
- },
43
- {
44
- "epoch": 0.78,
45
- "learning_rate": 3.697916666666667e-05,
46
- "loss": 0.0316,
47
- "step": 50
48
- },
49
- {
50
- "epoch": 0.94,
51
- "learning_rate": 3.4375e-05,
52
- "loss": 0.0242,
53
- "step": 60
54
- },
55
- {
56
- "epoch": 0.94,
57
- "eval_cer": 0.02981366459627329,
58
- "eval_loss": 0.02102348767220974,
59
- "eval_runtime": 445.6571,
60
- "eval_samples_per_second": 1.147,
61
- "eval_steps_per_second": 0.036,
62
- "step": 60
63
- },
64
- {
65
- "epoch": 1.09,
66
- "learning_rate": 3.177083333333333e-05,
67
- "loss": 0.0252,
68
- "step": 70
69
- },
70
- {
71
- "epoch": 1.25,
72
- "learning_rate": 2.916666666666667e-05,
73
- "loss": 0.0208,
74
- "step": 80
75
- },
76
- {
77
- "epoch": 1.41,
78
- "learning_rate": 2.6562500000000002e-05,
79
- "loss": 0.0203,
80
- "step": 90
81
- },
82
- {
83
- "epoch": 1.41,
84
- "eval_cer": 0.01937888198757764,
85
- "eval_loss": 0.018760638311505318,
86
- "eval_runtime": 489.631,
87
- "eval_samples_per_second": 1.044,
88
- "eval_steps_per_second": 0.033,
89
- "step": 90
90
- },
91
- {
92
- "epoch": 1.56,
93
- "learning_rate": 2.3958333333333334e-05,
94
- "loss": 0.02,
95
- "step": 100
96
- },
97
- {
98
- "epoch": 1.72,
99
- "learning_rate": 2.1354166666666666e-05,
100
- "loss": 0.0178,
101
- "step": 110
102
- },
103
- {
104
- "epoch": 1.88,
105
- "learning_rate": 1.8750000000000002e-05,
106
- "loss": 0.0169,
107
- "step": 120
108
- },
109
- {
110
- "epoch": 1.88,
111
- "eval_cer": 0.010186335403726708,
112
- "eval_loss": 0.01577191799879074,
113
- "eval_runtime": 572.6491,
114
- "eval_samples_per_second": 0.892,
115
- "eval_steps_per_second": 0.028,
116
- "step": 120
117
- },
118
- {
119
- "epoch": 2.03,
120
- "learning_rate": 1.6145833333333334e-05,
121
- "loss": 0.0161,
122
- "step": 130
123
- },
124
- {
125
- "epoch": 2.19,
126
- "learning_rate": 1.3541666666666666e-05,
127
- "loss": 0.0151,
128
- "step": 140
129
- },
130
- {
131
- "epoch": 2.34,
132
- "learning_rate": 1.09375e-05,
133
- "loss": 0.0151,
134
- "step": 150
135
- },
136
- {
137
- "epoch": 2.34,
138
- "eval_cer": 0.0084472049689441,
139
- "eval_loss": 0.014565763995051384,
140
- "eval_runtime": 618.7531,
141
- "eval_samples_per_second": 0.826,
142
- "eval_steps_per_second": 0.026,
143
- "step": 150
144
- },
145
- {
146
- "epoch": 2.5,
147
- "learning_rate": 8.333333333333334e-06,
148
- "loss": 0.015,
149
- "step": 160
150
- },
151
- {
152
- "epoch": 2.66,
153
- "learning_rate": 5.729166666666667e-06,
154
- "loss": 0.0139,
155
- "step": 170
156
- },
157
- {
158
- "epoch": 2.81,
159
- "learning_rate": 3.125e-06,
160
- "loss": 0.0133,
161
- "step": 180
162
- },
163
- {
164
- "epoch": 2.81,
165
- "eval_cer": 0.007950310559006211,
166
- "eval_loss": 0.014070576056838036,
167
- "eval_runtime": 564.3264,
168
- "eval_samples_per_second": 0.906,
169
- "eval_steps_per_second": 0.028,
170
- "step": 180
171
- }
172
- ],
173
- "max_steps": 192,
174
- "num_train_epochs": 3,
175
- "total_flos": 5.084609259497325e+18,
176
- "trial_name": null,
177
- "trial_params": null
178
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-180/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:13731dc01b37599b9b0f3d5fd0906ad0d86914ef40c4ea694dddf1b5ccc9e924
3
- size 3643