---
# Training configuration for a VietOCR-style text recogniser
# (backbone: vgg19_bn, seq_modeling: seq2seq).
#
# NOTE(review): the previous revision of this file had a "| " prefix on every
# line and no indentation, so it could not be parsed as YAML. The nesting
# below was reconstructed from key order, blank-line grouping and the public
# upstream VietOCR config layout. Placement of keys that upstream does not
# define (project, name, test_every, test_metrics, pretrained,
# test_annotation, *_lmdb) is an assumption - confirm against the code that
# loads this file.

# Run identification. Presumably consumed by experiment tracking - confirm.
project: vietocr_new
name: Train

# Compute device string handed to the framework.
device: cuda:0

# Character set of the recogniser. Single-quoted on purpose: backslash and
# double quote are literal, and '' encodes one apostrophe. The trailing space
# before the closing quote is part of the vocabulary.
vocab: 'aAàÀảẢãÃáÁạẠăĂằẰẳẲẵẴắẮặẶâÂầẦẩẨẫẪấẤậẬbBcCdDđĐeEèÈẻẺẽẼéÉẹẸêÊềỀểỂễỄếẾệỆfFgGhHiIìÌỉỈĩĨíÍịỊjJkKlLmMnNoOòÒỏỎõÕóÓọỌôÔồỒổỔỗỖốỐộỘơƠờỜởỞỡỠớỚợỢpPqQrRsStTuUùÙủỦũŨúÚụỤưƯừỪửỬữỮứỨựỰvVwWxXyYỳỲỷỶỹỸýÝỵỴzZ0123456789!"#$%&''()*+,-./:;<=>?@[\]^_`{|}~ '

# Sequence model selection and its hyper-parameters. The section is keyed
# "transformer" even though seq_modeling is seq2seq; upstream VietOCR uses the
# same key for both - keep the name unless the loader says otherwise.
seq_modeling: seq2seq
transformer:
  encoder_hidden: 256
  decoder_hidden: 256
  img_channel: 256
  decoder_embedded: 256
  dropout: 0.1

# Learning-rate settings. The names match a one-cycle schedule (peak LR and
# warm-up fraction) - presumably that is how they are used; confirm.
optimizer:
  max_lr: 0.001
  pct_start: 0.1

trainer:
  batch_size: 128
  # Intervals and total length below are presumably counted in iterations.
  print_every: 100
  valid_every: 500
  test_every: 500
  iters: 10000

  # Output locations for exported weights, resumable checkpoint and log file.
  export: weights/train_model.pth
  checkpoint: ./checkpoint/checkpoint_model.pth
  log: ./train.log

  # Presumably the number of samples used when computing validation / test
  # metrics (upstream semantics for `metrics`) - confirm.
  metrics: 49228
  test_metrics: 28918
  pretrained: false

dataset:
  data_root: /mnt/disk3/CGGANv2

  # Annotation files; presumably resolved relative to data_root - confirm.
  train_annotation: datasets/labels/train.txt
  valid_annotation: datasets/labels/valid.txt
  test_annotation: datasets/labels/test.txt

  # LMDB locations for each split.
  train_lmdb: datasets/lmdb/train
  valid_lmdb: datasets/lmdb/valid
  test_lmdb: datasets/lmdb/test

  # Input image geometry (presumably pixels).
  image_height: 32
  image_min_width: 32
  image_max_width: 512

dataloader:
  num_workers: 12
  pin_memory: true

# Augmentation switches; both are disabled in this configuration.
aug:
  image_aug: false
  masked_language_model: false

predictor:
  beamsearch: false

quiet: false

# Pretrained weights: `pretrain` is presumably used when training,
# `weights` when predicting (upstream convention) - confirm.
pretrain: https://vocr.vn/data/vietocr/vgg_seq2seq.pth

weights: https://vocr.vn/data/vietocr/vgg_seq2seq.pth

backbone: vgg19_bn
cnn:
  # Five [a, b] pairs each. Presumably per-stage pooling stride (ss) and
  # pooling kernel size (ks) as in upstream VietOCR - confirm.
  ss:
    - [2, 2]
    - [2, 2]
    - [2, 1]
    - [2, 1]
    - [1, 1]

  ks:
    - [2, 2]
    - [2, 2]
    - [2, 1]
    - [2, 1]
    - [1, 1]

  hidden: 256