End of training

Browse files

Files changed (9) hide show

README.md +95 -0
config.json +174 -0
generation_config.json +13 -0
model.safetensors +3 -0
preprocessor_config.json +27 -0
runs/Dec09_09-58-26_f5a54d6e7030/events.out.tfevents.1733738333.f5a54d6e7030.547.0 +3 -0
runs/Dec09_10-02-28_f5a54d6e7030/events.out.tfevents.1733738561.f5a54d6e7030.547.1 +3 -0
runs/Dec09_10-02-28_f5a54d6e7030/events.out.tfevents.1733741470.f5a54d6e7030.547.2 +3 -0
training_args.bin +3 -0

README.md ADDED Viewed

	@@ -0,0 +1,95 @@

+---
+library_name: transformers
+language:
+- fr
+base_model: microsoft/trocr-small-handwritten
+tags:
+- generated_from_trainer
+metrics:
+- wer
+model-index:
+- name: TrOCR Small (Finetuned on French)
+  results: []
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# TrOCR Small (Finetuned on French)
+This model is a fine-tuned version of [microsoft/trocr-small-handwritten](https://huggingface.co/microsoft/trocr-small-handwritten) on an unspecified dataset (no dataset name was recorded by the Trainer).
+It achieves the following results on the evaluation set:
+- Loss: 0.1007
+- Model Preparation Time: 0.0057
+- Cer: 0.0138
+- Wer: 0.0455
+- Ratio: 98.3979
+## Model description
+More information needed
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 1e-05
+- train_batch_size: 8
+- eval_batch_size: 8
+- seed: 42
+- optimizer: adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 (no additional optimizer arguments)
+- lr_scheduler_type: linear
+- training_steps: 12000
+- mixed_precision_training: Native AMP
+### Training results
+| Training Loss | Epoch  | Step  | Validation Loss | Model Preparation Time | Cer    | Wer    | Ratio   |
+|:-------------:|:------:|:-----:|:---------------:|:----------------------:|:------:|:------:|:-------:|
+| 0.1386        | 0.0333 | 400   | 0.1543          | 0.0057                 | 0.0190 | 0.0819 | 98.6922 |
+| 0.1298        | 0.0667 | 800   | 0.1300          | 0.0057                 | 0.0130 | 0.0526 | 98.9649 |
+| 0.1171        | 0.1    | 1200  | 0.1622          | 0.0057                 | 0.0200 | 0.0760 | 98.3437 |
+| 0.1035        | 0.1333 | 1600  | 0.1538          | 0.0057                 | 0.0190 | 0.0760 | 98.6841 |
+| 0.1186        | 0.1667 | 2000  | 0.1605          | 0.0057                 | 0.0170 | 0.0760 | 98.9547 |
+| 0.1285        | 0.2    | 2400  | 0.1675          | 0.0057                 | 0.0190 | 0.0643 | 98.5663 |
+| 0.1043        | 0.2333 | 2800  | 0.1511          | 0.0057                 | 0.0220 | 0.0702 | 98.4283 |
+| 0.1294        | 0.2667 | 3200  | 0.1647          | 0.0057                 | 0.0150 | 0.0526 | 98.9361 |
+| 0.0954        | 0.3    | 3600  | 0.1532          | 0.0057                 | 0.0160 | 0.0526 | 98.7555 |
+| 0.111         | 0.3333 | 4000  | 0.1577          | 0.0057                 | 0.0210 | 0.0643 | 98.1890 |
+| 0.114         | 0.3667 | 4400  | 0.1378          | 0.0057                 | 0.0160 | 0.0585 | 98.6565 |
+| 0.1183        | 0.4    | 4800  | 0.1163          | 0.0057                 | 0.0070 | 0.0351 | 99.3075 |
+| 0.1277        | 0.4333 | 5200  | 0.1571          | 0.0057                 | 0.0160 | 0.0760 | 98.8328 |
+| 0.1219        | 0.4667 | 5600  | 0.1571          | 0.0057                 | 0.0150 | 0.0526 | 98.7910 |
+| 0.1101        | 0.5    | 6000  | 0.1245          | 0.0057                 | 0.0130 | 0.0526 | 99.0524 |
+| 0.1069        | 0.5333 | 6400  | 0.1470          | 0.0057                 | 0.0130 | 0.0585 | 99.0389 |
+| 0.1126        | 0.5667 | 6800  | 0.1302          | 0.0057                 | 0.0140 | 0.0526 | 98.9437 |
+| 0.0837        | 1.0137 | 7200  | 0.1323          | 0.0057                 | 0.0200 | 0.0702 | 98.4624 |
+| 0.0809        | 1.047  | 7600  | 0.1180          | 0.0057                 | 0.0100 | 0.0409 | 99.4630 |
+| 0.0889        | 1.0803 | 8000  | 0.1241          | 0.0057                 | 0.0180 | 0.0702 | 98.7486 |
+| 0.0711        | 1.1137 | 8400  | 0.1174          | 0.0057                 | 0.0150 | 0.0585 | 98.8769 |
+| 0.0736        | 1.147  | 8800  | 0.1166          | 0.0057                 | 0.0120 | 0.0468 | 99.0708 |
+| 0.0786        | 1.1803 | 9200  | 0.1080          | 0.0057                 | 0.0080 | 0.0351 | 99.5225 |
+| 0.0686        | 1.2137 | 9600  | 0.1037          | 0.0057                 | 0.0070 | 0.0292 | 99.5887 |
+| 0.0738        | 1.2470 | 10000 | 0.1127          | 0.0057                 | 0.0140 | 0.0468 | 99.0132 |
+| 0.07          | 1.2803 | 10400 | 0.1051          | 0.0057                 | 0.0120 | 0.0409 | 99.0954 |
+| 0.0697        | 1.3137 | 10800 | 0.1003          | 0.0057                 | 0.0090 | 0.0292 | 99.2171 |
+| 0.0686        | 1.347  | 11200 | 0.1038          | 0.0057                 | 0.0120 | 0.0351 | 98.9317 |
+| 0.0763        | 1.3803 | 11600 | 0.1028          | 0.0057                 | 0.0120 | 0.0351 | 98.9317 |
+| 0.0717        | 1.4137 | 12000 | 0.1018          | 0.0057                 | 0.0120 | 0.0351 | 98.9317 |
+### Framework versions
+- Transformers 4.46.3
+- Pytorch 2.5.1+cu121
+- Datasets 3.1.0
+- Tokenizers 0.20.3

config.json ADDED Viewed

	@@ -0,0 +1,174 @@

+{
+  "_name_or_path": "/content/drive/MyDrive/Colab Notebooks/trocr/model",
+  "architectures": [
+    "VisionEncoderDecoderModel"
+  ],
+  "decoder": {
+    "_attn_implementation_autoset": false,
+    "_name_or_path": "",
+    "activation_dropout": 0.0,
+    "activation_function": "relu",
+    "add_cross_attention": true,
+    "architectures": null,
+    "attention_dropout": 0.0,
+    "bad_words_ids": null,
+    "begin_suppress_tokens": null,
+    "bos_token_id": 0,
+    "chunk_size_feed_forward": 0,
+    "classifier_dropout": 0.0,
+    "cross_attention_hidden_size": 384,
+    "d_model": 256,
+    "decoder_attention_heads": 8,
+    "decoder_ffn_dim": 1024,
+    "decoder_layerdrop": 0.0,
+    "decoder_layers": 6,
+    "decoder_start_token_id": 2,
+    "diversity_penalty": 0.0,
+    "do_sample": false,
+    "dropout": 0.1,
+    "early_stopping": false,
+    "encoder_no_repeat_ngram_size": 0,
+    "eos_token_id": 2,
+    "exponential_decay_length_penalty": null,
+    "finetuning_task": null,
+    "forced_bos_token_id": null,
+    "forced_eos_token_id": null,
+    "id2label": {
+      "0": "LABEL_0",
+      "1": "LABEL_1"
+    },
+    "init_std": 0.02,
+    "is_decoder": true,
+    "is_encoder_decoder": false,
+    "label2id": {
+      "LABEL_0": 0,
+      "LABEL_1": 1
+    },
+    "layernorm_embedding": true,
+    "length_penalty": 1.0,
+    "max_length": 20,
+    "max_position_embeddings": 512,
+    "min_length": 0,
+    "model_type": "trocr",
+    "no_repeat_ngram_size": 0,
+    "num_beam_groups": 1,
+    "num_beams": 1,
+    "num_return_sequences": 1,
+    "output_attentions": false,
+    "output_hidden_states": false,
+    "output_scores": false,
+    "pad_token_id": 1,
+    "prefix": null,
+    "problem_type": null,
+    "pruned_heads": {},
+    "remove_invalid_values": false,
+    "repetition_penalty": 1.0,
+    "return_dict": true,
+    "return_dict_in_generate": false,
+    "scale_embedding": true,
+    "sep_token_id": null,
+    "suppress_tokens": null,
+    "task_specific_params": null,
+    "temperature": 1.0,
+    "tf_legacy_loss": false,
+    "tie_encoder_decoder": false,
+    "tie_word_embeddings": false,
+    "tokenizer_class": null,
+    "top_k": 50,
+    "top_p": 1.0,
+    "torch_dtype": null,
+    "torchscript": false,
+    "typical_p": 1.0,
+    "use_bfloat16": false,
+    "use_cache": false,
+    "use_learned_position_embeddings": true,
+    "vocab_size": 64044
+  },
+  "decoder_start_token_id": 0,
+  "encoder": {
+    "_attn_implementation_autoset": false,
+    "_name_or_path": "",
+    "add_cross_attention": false,
+    "architectures": null,
+    "attention_probs_dropout_prob": 0.0,
+    "bad_words_ids": null,
+    "begin_suppress_tokens": null,
+    "bos_token_id": null,
+    "chunk_size_feed_forward": 0,
+    "cross_attention_hidden_size": null,
+    "decoder_start_token_id": null,
+    "diversity_penalty": 0.0,
+    "do_sample": false,
+    "early_stopping": false,
+    "encoder_no_repeat_ngram_size": 0,
+    "encoder_stride": 16,
+    "eos_token_id": null,
+    "exponential_decay_length_penalty": null,
+    "finetuning_task": null,
+    "forced_bos_token_id": null,
+    "forced_eos_token_id": null,
+    "hidden_act": "gelu",
+    "hidden_dropout_prob": 0.0,
+    "hidden_size": 384,
+    "id2label": {
+      "0": "LABEL_0",
+      "1": "LABEL_1"
+    },
+    "image_size": 384,
+    "initializer_range": 0.02,
+    "intermediate_size": 1536,
+    "is_decoder": false,
+    "is_encoder_decoder": false,
+    "label2id": {
+      "LABEL_0": 0,
+      "LABEL_1": 1
+    },
+    "layer_norm_eps": 1e-12,
+    "length_penalty": 1.0,
+    "max_length": 20,
+    "min_length": 0,
+    "model_type": "deit",
+    "no_repeat_ngram_size": 0,
+    "num_attention_heads": 6,
+    "num_beam_groups": 1,
+    "num_beams": 1,
+    "num_channels": 3,
+    "num_hidden_layers": 12,
+    "num_return_sequences": 1,
+    "output_attentions": false,
+    "output_hidden_states": false,
+    "output_scores": false,
+    "pad_token_id": null,
+    "patch_size": 16,
+    "prefix": null,
+    "problem_type": null,
+    "pruned_heads": {},
+    "qkv_bias": true,
+    "remove_invalid_values": false,
+    "repetition_penalty": 1.0,
+    "return_dict": true,
+    "return_dict_in_generate": false,
+    "sep_token_id": null,
+    "suppress_tokens": null,
+    "task_specific_params": null,
+    "temperature": 1.0,
+    "tf_legacy_loss": false,
+    "tie_encoder_decoder": false,
+    "tie_word_embeddings": true,
+    "tokenizer_class": null,
+    "top_k": 50,
+    "top_p": 1.0,
+    "torch_dtype": null,
+    "torchscript": false,
+    "typical_p": 1.0,
+    "use_bfloat16": false
+  },
+  "eos_token_id": 2,
+  "is_encoder_decoder": true,
+  "model_type": "vision-encoder-decoder",
+  "pad_token_id": 1,
+  "tie_word_embeddings": false,
+  "torch_dtype": "float32",
+  "transformers_version": "4.46.3",
+  "vocab_size": 64044
+}

generation_config.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+  "bos_token_id": 0,
+  "decoder_start_token_id": 2,
+  "early_stopping": true,
+  "eos_token_id": 2,
+  "length_penalty": 2.0,
+  "max_length": 64,
+  "no_repeat_ngram_size": 3,
+  "num_beams": 3,
+  "pad_token_id": 1,
+  "transformers_version": "4.46.3",
+  "use_cache": false
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7e0add54603bfd0d8e5783c0d9b2ea30e3c8c26a724668066240ac832f785049
+size 246430696

preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "crop_size": {
+    "height": 224,
+    "width": 224
+  },
+  "do_center_crop": false,
+  "do_normalize": true,
+  "do_rescale": true,
+  "do_resize": true,
+  "image_mean": [
+    0.5,
+    0.5,
+    0.5
+  ],
+  "image_processor_type": "DeiTImageProcessor",
+  "image_std": [
+    0.5,
+    0.5,
+    0.5
+  ],
+  "resample": 3,
+  "rescale_factor": 0.00392156862745098,
+  "size": {
+    "height": 384,
+    "width": 384
+  }
+}

runs/Dec09_09-58-26_f5a54d6e7030/events.out.tfevents.1733738333.f5a54d6e7030.547.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:08e5be000f4fc07499a3e38e8c67d7ddf5f72454da16f8c66da6ce15d6c588b9
+size 11850

runs/Dec09_10-02-28_f5a54d6e7030/events.out.tfevents.1733738561.f5a54d6e7030.547.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d2ca82c0ff69eb4c9e3d2ed9f11e2c5ca224505c0572904732778ebb8a84e887
+size 49967

runs/Dec09_10-02-28_f5a54d6e7030/events.out.tfevents.1733741470.f5a54d6e7030.547.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1634b17bb26b270a84ad0300e36a9a6483c62eae18bdf52190bb0b30ccafbf75
+size 568

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ea3a406bc35e2897b9e6805f72360ea367f6af53d083eaec29e91430121ecf39
+size 5432