{
  "experiment": "ota_boun",
  "name": "bert-base-turkish-cased",
  "n_gpu": 1,
  "model": {
    "type": "MultiParser",
    "args": {
      "embeddings_processor": {
        "type": "BertWrapper",
        "args": {
          "model_path": "data/pretrained_embeddings/bert-base-turkish-cased-nonpretrained",
          "fine_tune": true,
          "hidden_dropout": 0.2,
          "attn_dropout": 0.2,
          "output_dropout": 0.5,
          "scalar_mix_layer_dropout": 0.1,
          "token_mask_prob": 0.15
        }
      },
      "outputs": {
        "heads": {
          "type": "ArcScorer",
          "args": {
            "scorer_class": "DeepBiaffineScorer",
            "head_mode": "single_head",
            "hidden_size": 768,
            "dropout": 0.33,
            "vocab": {
              "type": "IntegerVocab"
            }
          }
        },
        "labels": {
          "type": "DependencyClassifier",
          "args": {
            "scorer_class": "DeepBiaffineScorer",
            "hidden_size": 256,
            "dropout": 0.33,
            "vocab": {
              "type": "BasicVocab",
              "args": {
                "vocab_filename": "data/corpora/ota_boun/vocab/basic.vocab"
              }
            }
          }
        }
      },
      "post_processors": [
        {
          "type": "FactorizedMSTPostProcessor",
          "args": {
            "annotation_ids": [
              "heads",
              "labels"
            ]
          }
        }
      ]
    }
  },
  "data_loaders": {
    "type": "BucketedCONLLLoader",
    "args": {
      "annotation_layers": {
        "heads": {
          "type": "TagSequence",
          "source_column": 6,
          "args": {
            "ignore_root": true
          }
        },
        "labels": {
          "type": "DependencyMatrix",
          "source_column": [
            6,
            7
          ],
          "args": {
            "ignore_non_relations": true
          }
        }
      },
      "batch_size": 32,
      "bucket_size": 256,
      "max_tokens_per_batch": 156800,
      "num_workers": 2
    },
    "paths": {
      "train": "data/corpora/ota_boun/ota_boun-ud-train.conllu",
      "dev": "data/corpora/ota_boun/ota_boun-ud-test.conllu",
      "test": "data/corpora/ota_boun/tr_boun-ud-test.conllu"
    }
  },
  "trainer": {
    "min_epochs": 15,
    "max_epochs": 300,
    "early_stop": 15,
    "save_dir": "data/saved_models/",
    "save_period": 20,
    "verbosity": 2,
    "validation_criterion": {
      "metrics": {
        "heads": "fscore",
        "labels": "fscore"
      },
      "weighting": "multiplicative"
    },
    "optimizer": {
      "type": "AdamW",
      "args": {
        "lr": 4e-05,
        "weight_decay": 0.0
      }
    },
    "lr_scheduler": {
      "type": "LambdaLR",
      "args": {
        "lr_lambda": "SqrtSchedule(400)"
      }
    },
    "loss": {
      "type": "CrossEntropyLoss",
      "args": {
        "ignore_index": -1
      }
    }
  }
}