| { |
| "CUDA_VISIBLE_DEVICES": "0", |
| "USE_TORCH": "1", |
| "output_hidden_states": null, |
| "pretrained_model_name_or_path": "hfl/chinese-macbert-base", |
| "model_save_path": "../output/text_correction/model_public_csc", |
| "config_name": "csc.config", |
| "model_name": "pytorch_model.bin", |
| "path_train": "csc_public.train.json", |
| "path_dev": "csc_public.dev.json", |
| "path_tet": "csc_public.tet.json", |
| "scheduler_name": "cosine", |
| "tokenizer_type": "CHAR", |
| "padding_side": "RIGHT", |
| "active_type": "RELU", |
| "task_type": "CSC", |
| "model_type": "BERT", |
| "loss_type": "BCE", |
| "loss_det_rate": 0.3, |
| "max_len_limit": 512, |
| "batch_size": 32, |
| "num_labels": 0, |
| "max_len": 128, |
| "epochs": 3, |
| "lr": 3e-05, |
| "grad_accum_steps": 4, |
| "max_grad_norm": 1.0, |
| "weight_decay": 0.01, |
| "dropout_rate": 0.1, |
| "adam_eps": 1e-08, |
| "seed": 42, |
| "evaluate_steps": 1000, |
| "warmup_steps": 0.1, |
| "ignore_index": 0, |
| "save_steps": 1000, |
| "stop_epochs": 4, |
| "num_workers": 0, |
| "max_steps": -1, |
| "flag_save_model_state": true, |
| "flag_dynamic_encode": false, |
| "flag_tokenizer_char": true, |
| "flag_soft_label": true, |
| "flag_save_best": true, |
| "flag_dropout": false, |
| "flag_shuffle": true, |
| "flag_active": false, |
| "flag_train": false, |
| "flag_cuda": true, |
| "flag_mft": true, |
| "flag_adv": false, |
| "xy_keys_predict": [ |
| "original_text", |
| "correct_text", |
| "wrong_ids" |
| ], |
| "keys": [ |
| "original_text", |
| "correct_text", |
| "wrong_ids" |
| ], |
| "save_best_mertics_key": [ |
| "sentence", |
| "strict_cor_f1" |
| ], |
| "label_sep": "|myz|", |
| "multi_label_threshold": 0.5, |
| "len_rate": 1, |
| "adv_emb_name": "word_embeddings.", |
| "adv_eps": 1.0, |
| "additional_special_tokens": [], |
| "len_corpus": null, |
| "prior_count": null, |
| "prior": null, |
| "l2i": null, |
| "i2l": null, |
| "xy_keys": [ |
| "original_text", |
| "correct_text", |
| "wrong_ids" |
| ] |
| } |