| optim: |
| gradient_clip: |
| active: true |
| clip: 0.01 |
| cls: AdamW |
| param: |
| lr: 3.0e-05 |
| betas: |
| - 0.9 |
| - 0.999 |
| eps: 1.0e-06 |
| weight_decay: 0.01 |
| amsgrad: false |
| loss: |
| class_weight: |
| active: true |
| seed: 1234 |
| device: |
| device: cuda |
| n_gpu: 8 |
| model: |
| bert: |
| name: roberta_base_ja_20190121_m10000_v24000_u500000 |
| train: |
| epoch: 10 |
| batch_size: 400 |
| eval: |
| batch_size: 800 |
| data: |
| wikipedia: |
| debug_size: null |
| dir: ./dataset/jawiki-20190121-cirrussearch-content |
| add_dir: ./outputs/large_el_base_wikilink_extention/predicts/jawiki-20190121-cirrussearch-content |
| filter_no_link: false |
| ene: |
| path: ./dataset/Shinra2023_Classification_train_20230416.jsonl |
| add_path: ./outputs/ene_classifier/jawiki-20190121-cirrussearch-content/predict.jsonl |
| encoding: BIOUL |
| dev_size: 100 |
| seq_len: 512 |
| dup_len: 32 |
| dataloader: |
| num_workers: 8 |
| setting: |
| trainer: |
| cls: BaselineTrainer |
| type: |
| dataset: |
| cls: NERCRFDataset |
| model: |
| cls: NERCRFModel |
| crf: |
| cls: PatialEERCRF |
| partial: true |
| add_se_tag: true |
| eer: |
| ratio: null |
| margin: 0.0 |
| weight: 10 |
|
|