Upload folder using huggingface_hub

Browse files

Files changed (14)

.gitattributes +6 -0
best_accuracy.pdopt +3 -0
best_accuracy/metric.states +0 -0
best_accuracy/model_config.json +45 -0
best_accuracy/model_state.pdparams +3 -0
best_model/model.pdopt +3 -0
best_model/model_config.json +45 -0
best_model/model_state.pdparams +3 -0
config.yml +161 -0
latest.pdopt +3 -0
latest/metric.states +0 -0
latest/model_config.json +45 -0
latest/model_state.pdparams +3 -0
train.log +0 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,9 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+best_accuracy/model_state.pdparams filter=lfs diff=lfs merge=lfs -text
+best_accuracy.pdopt filter=lfs diff=lfs merge=lfs -text
+best_model/model.pdopt filter=lfs diff=lfs merge=lfs -text
+best_model/model_state.pdparams filter=lfs diff=lfs merge=lfs -text
+latest/model_state.pdparams filter=lfs diff=lfs merge=lfs -text
+latest.pdopt filter=lfs diff=lfs merge=lfs -text

best_accuracy.pdopt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3e0d10ed58c0f46f4e5b76ff2648146636ce057ba838e95bd18a23d011da2ea0
+size 2224406688

best_accuracy/metric.states ADDED Viewed

Binary file (384 Bytes). View file

best_accuracy/model_config.json ADDED Viewed

	@@ -0,0 +1,45 @@

+{
+  "num_classes": 79,
+  "dropout": null,
+  "init_args": [
+    {
+      "attention_probs_dropout_prob": 0.1,
+      "bos_token_id": 0,
+      "coordinate_size": 128,
+      "eos_token_id": 2,
+      "fast_qkv": false,
+      "gradient_checkpointing": false,
+      "has_relative_attention_bias": false,
+      "has_spatial_attention_bias": false,
+      "has_visual_segment_embedding": true,
+      "use_visual_backbone": false,
+      "hidden_act": "gelu",
+      "hidden_dropout_prob": 0.1,
+      "hidden_size": 768,
+      "image_feature_pool_shape": [
+        7,
+        7,
+        256
+      ],
+      "initializer_range": 0.02,
+      "intermediate_size": 3072,
+      "layer_norm_eps": 1e-05,
+      "max_2d_position_embeddings": 1024,
+      "max_position_embeddings": 514,
+      "max_rel_2d_pos": 256,
+      "max_rel_pos": 128,
+      "model_type": "layoutlmv2",
+      "num_attention_heads": 12,
+      "num_hidden_layers": 12,
+      "output_past": true,
+      "pad_token_id": 1,
+      "shape_size": 128,
+      "rel_2d_pos_bins": 64,
+      "rel_pos_bins": 32,
+      "type_vocab_size": 1,
+      "vocab_size": 250002,
+      "init_class": "LayoutXLMModel"
+    }
+  ],
+  "init_class": "LayoutXLMForTokenClassification"
+}

best_accuracy/model_state.pdparams ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bc2883904bf8874460c2771be1fd97a9d45950b770216d8ebf18a21a79da1832
+size 1114551884

best_model/model.pdopt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3e0d10ed58c0f46f4e5b76ff2648146636ce057ba838e95bd18a23d011da2ea0
+size 2224406688

best_model/model_config.json ADDED Viewed

	@@ -0,0 +1,45 @@

+{
+  "num_classes": 79,
+  "dropout": null,
+  "init_args": [
+    {
+      "attention_probs_dropout_prob": 0.1,
+      "bos_token_id": 0,
+      "coordinate_size": 128,
+      "eos_token_id": 2,
+      "fast_qkv": false,
+      "gradient_checkpointing": false,
+      "has_relative_attention_bias": false,
+      "has_spatial_attention_bias": false,
+      "has_visual_segment_embedding": true,
+      "use_visual_backbone": false,
+      "hidden_act": "gelu",
+      "hidden_dropout_prob": 0.1,
+      "hidden_size": 768,
+      "image_feature_pool_shape": [
+        7,
+        7,
+        256
+      ],
+      "initializer_range": 0.02,
+      "intermediate_size": 3072,
+      "layer_norm_eps": 1e-05,
+      "max_2d_position_embeddings": 1024,
+      "max_position_embeddings": 514,
+      "max_rel_2d_pos": 256,
+      "max_rel_pos": 128,
+      "model_type": "layoutlmv2",
+      "num_attention_heads": 12,
+      "num_hidden_layers": 12,
+      "output_past": true,
+      "pad_token_id": 1,
+      "shape_size": 128,
+      "rel_2d_pos_bins": 64,
+      "rel_pos_bins": 32,
+      "type_vocab_size": 1,
+      "vocab_size": 250002,
+      "init_class": "LayoutXLMModel"
+    }
+  ],
+  "init_class": "LayoutXLMForTokenClassification"
+}

best_model/model_state.pdparams ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bc2883904bf8874460c2771be1fd97a9d45950b770216d8ebf18a21a79da1832
+size 1114551884

config.yml ADDED Viewed

	@@ -0,0 +1,161 @@

+Global:
+  use_gpu: true
+  epoch_num: 200
+  log_smooth_window: 10
+  print_batch_step: 10
+  save_model_dir: ./output/ser_vi_layoutxlm_xfund_zh
+  save_epoch_step: 2000
+  eval_batch_step:
+  - 0
+  - 19
+  cal_metric_during_train: false
+  save_inference_dir: null
+  use_visualdl: false
+  seed: 2022
+  infer_img: ppstructure/docs/kie/input/zh_val_42.jpg
+  d2s_train_image_shape:
+  - 3
+  - 224
+  - 224
+  save_res_path: /content/PaddleOCR/output/ser_layoutxlm_xfund_zh/res
+  kie_rec_model_dir: null
+  kie_det_model_dir: null
+  amp_custom_white_list:
+  - scale
+  - concat
+  - elementwise_add
+Architecture:
+  model_type: kie
+  algorithm: LayoutXLM
+  Transform: null
+  Backbone:
+    name: LayoutXLMForSer
+    pretrained: true
+    checkpoints: null
+    mode: vi
+    num_classes: 79
+Loss:
+  name: VQASerTokenLayoutLMLoss
+  num_classes: 79
+  key: backbone_out
+Optimizer:
+  name: AdamW
+  beta1: 0.9
+  beta2: 0.999
+  lr:
+    name: Linear
+    learning_rate: 5.0e-05
+    epochs: 200
+    warmup_epoch: 2
+  regularizer:
+    name: L2
+    factor: 0.0
+PostProcess:
+  name: VQASerTokenLayoutLMPostProcess
+  class_path: /content/PaddleOCR/dataset/class_list_jmfunsd.txt
+Metric:
+  name: VQASerTokenMetric
+  main_indicator: hmean
+Train:
+  dataset:
+    name: SimpleDataSet
+    data_dir: /content/PaddleOCR/dataset/training_data/images
+    label_file_list:
+    - /content/PaddleOCR/dataset/train.json
+    ratio_list:
+    - 1.0
+    transforms:
+    - DecodeImage:
+        img_mode: RGB
+        channel_first: false
+    - VQATokenLabelEncode:
+        contains_re: false
+        algorithm: LayoutXLM
+        class_path: /content/PaddleOCR/dataset/class_list_jmfunsd.txt
+        use_textline_bbox_info: true
+        order_method: tb-yx
+    - VQATokenPad:
+        max_seq_len: 512
+        return_attention_mask: true
+    - VQASerTokenChunk:
+        max_seq_len: 512
+    - Resize:
+        size:
+        - 224
+        - 224
+    - NormalizeImage:
+        scale: 1
+        mean:
+        - 123.675
+        - 116.28
+        - 103.53
+        std:
+        - 58.395
+        - 57.12
+        - 57.375
+        order: hwc
+    - ToCHWImage: null
+    - KeepKeys:
+        keep_keys:
+        - input_ids
+        - bbox
+        - attention_mask
+        - token_type_ids
+        - image
+        - labels
+  loader:
+    shuffle: true
+    drop_last: false
+    batch_size_per_card: 8
+    num_workers: 4
+Eval:
+  dataset:
+    name: SimpleDataSet
+    data_dir: /content/PaddleOCR/dataset/testing_data/images
+    label_file_list:
+    - /content/PaddleOCR/dataset/test.json
+    transforms:
+    - DecodeImage:
+        img_mode: RGB
+        channel_first: false
+    - VQATokenLabelEncode:
+        contains_re: false
+        algorithm: LayoutXLM
+        class_path: /content/PaddleOCR/dataset/class_list_jmfunsd.txt
+        use_textline_bbox_info: true
+        order_method: tb-yx
+    - VQATokenPad:
+        max_seq_len: 512
+        return_attention_mask: true
+    - VQASerTokenChunk:
+        max_seq_len: 512
+    - Resize:
+        size:
+        - 224
+        - 224
+    - NormalizeImage:
+        scale: 1
+        mean:
+        - 123.675
+        - 116.28
+        - 103.53
+        std:
+        - 58.395
+        - 57.12
+        - 57.375
+        order: hwc
+    - ToCHWImage: null
+    - KeepKeys:
+        keep_keys:
+        - input_ids
+        - bbox
+        - attention_mask
+        - token_type_ids
+        - image
+        - labels
+  loader:
+    shuffle: false
+    drop_last: false
+    batch_size_per_card: 8
+    num_workers: 4
+profiler_options: null

latest.pdopt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:521df5a5ebcf90aa3402b2370452cce35023c6381d7e92fed9b99e1942462e6a
+size 2224406688

latest/metric.states ADDED Viewed

Binary file (384 Bytes). View file

latest/model_config.json ADDED Viewed

	@@ -0,0 +1,45 @@

+{
+  "num_classes": 79,
+  "dropout": null,
+  "init_args": [
+    {
+      "attention_probs_dropout_prob": 0.1,
+      "bos_token_id": 0,
+      "coordinate_size": 128,
+      "eos_token_id": 2,
+      "fast_qkv": false,
+      "gradient_checkpointing": false,
+      "has_relative_attention_bias": false,
+      "has_spatial_attention_bias": false,
+      "has_visual_segment_embedding": true,
+      "use_visual_backbone": false,
+      "hidden_act": "gelu",
+      "hidden_dropout_prob": 0.1,
+      "hidden_size": 768,
+      "image_feature_pool_shape": [
+        7,
+        7,
+        256
+      ],
+      "initializer_range": 0.02,
+      "intermediate_size": 3072,
+      "layer_norm_eps": 1e-05,
+      "max_2d_position_embeddings": 1024,
+      "max_position_embeddings": 514,
+      "max_rel_2d_pos": 256,
+      "max_rel_pos": 128,
+      "model_type": "layoutlmv2",
+      "num_attention_heads": 12,
+      "num_hidden_layers": 12,
+      "output_past": true,
+      "pad_token_id": 1,
+      "shape_size": 128,
+      "rel_2d_pos_bins": 64,
+      "rel_pos_bins": 32,
+      "type_vocab_size": 1,
+      "vocab_size": 250002,
+      "init_class": "LayoutXLMModel"
+    }
+  ],
+  "init_class": "LayoutXLMForTokenClassification"
+}

latest/model_state.pdparams ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:25a3c91294ea276505641f8f223f66e6006e8860ee50715b1d16d977bedb799c
+size 1114551884

train.log ADDED Viewed

The diff for this file is too large to render. See raw diff