Model with accuracy: 0.8381
Browse files
- README.md +0 -1
- config.json +4 -1
README.md
CHANGED
|
@@ -1,4 +1,3 @@
|
|
| 1 |
-
|
| 2 |
---
|
| 3 |
language: en
|
| 4 |
tags:
|
|
|
|
|
|
|
| 1 |
---
|
| 2 |
language: en
|
| 3 |
tags:
|
config.json
CHANGED
|
@@ -1,4 +1,5 @@
|
|
| 1 |
{
|
|
|
|
| 2 |
"architectures": [
|
| 3 |
"VisionEncoderDecoderModel"
|
| 4 |
],
|
|
@@ -85,8 +86,9 @@
|
|
| 85 |
"typical_p": 1.0,
|
| 86 |
"use_bfloat16": false,
|
| 87 |
"use_cache": true,
|
| 88 |
-
"vocab_size":
|
| 89 |
},
|
|
|
|
| 90 |
"encoder": {
|
| 91 |
"_attn_implementation_autoset": false,
|
| 92 |
"_name_or_path": "",
|
|
@@ -185,6 +187,7 @@
|
|
| 185 |
},
|
| 186 |
"is_encoder_decoder": true,
|
| 187 |
"model_type": "vision-encoder-decoder",
|
|
|
|
| 188 |
"tie_word_embeddings": false,
|
| 189 |
"torch_dtype": "float32",
|
| 190 |
"transformers_version": "4.49.0.dev0"
|
|
|
|
| 1 |
{
|
| 2 |
+
"_name_or_path": "naver-clova-ix/donut-base",
|
| 3 |
"architectures": [
|
| 4 |
"VisionEncoderDecoderModel"
|
| 5 |
],
|
|
|
|
| 86 |
"typical_p": 1.0,
|
| 87 |
"use_bfloat16": false,
|
| 88 |
"use_cache": true,
|
| 89 |
+
"vocab_size": 57534
|
| 90 |
},
|
| 91 |
+
"decoder_start_token_id": 57533,
|
| 92 |
"encoder": {
|
| 93 |
"_attn_implementation_autoset": false,
|
| 94 |
"_name_or_path": "",
|
|
|
|
| 187 |
},
|
| 188 |
"is_encoder_decoder": true,
|
| 189 |
"model_type": "vision-encoder-decoder",
|
| 190 |
+
"pad_token_id": 1,
|
| 191 |
"tie_word_embeddings": false,
|
| 192 |
"torch_dtype": "float32",
|
| 193 |
"transformers_version": "4.49.0.dev0"
|