Macropodus
/

macbert4mdcspell_v1

Text Generation

chinses-spelling-correct

chinese-spelling-check

中文拼写纠错

Model card | Files and versions

macbert4mdcspell_v1 / csc.config

Macropodus's picture

Upload 7 files

6372da2 verified over 1 year ago

2.04 kB

	{
	"CUDA_VISIBLE_DEVICES": "0",
	"USE_TORCH": "1",
	"output_hidden_states": null,
	"pretrained_model_name_or_path": "hfl/chinese-macbert-base",
	"model_save_path": "../output/text_correction/model_public_csc",
	"config_name": "csc.config",
	"model_name": "pytorch_model.bin",
	"path_train": "csc_public.train.json",
	"path_dev": "csc_public.dev.json",
	"path_tet": "csc_public.tet.json",
	"scheduler_name": "cosine",
	"tokenizer_type": "CHAR",
	"padding_side": "RIGHT",
	"active_type": "RELU",
	"task_type": "CSC",
	"model_type": "BERT",
	"loss_type": "BCE",
	"loss_det_rate": 0.3,
	"max_len_limit": 512,
	"batch_size": 32,
	"num_labels": 0,
	"max_len": 128,
	"epochs": 3,
	"lr": 3e-05,
	"grad_accum_steps": 4,
	"max_grad_norm": 1.0,
	"weight_decay": 0.01,
	"dropout_rate": 0.1,
	"adam_eps": 1e-08,
	"seed": 42,
	"evaluate_steps": 1000,
	"warmup_steps": 0.1,
	"ignore_index": 0,
	"save_steps": 1000,
	"stop_epochs": 4,
	"num_workers": 0,
	"max_steps": -1,
	"flag_save_model_state": true,
	"flag_dynamic_encode": false,
	"flag_tokenizer_char": true,
	"flag_soft_label": true,
	"flag_save_best": true,
	"flag_dropout": false,
	"flag_shuffle": true,
	"flag_active": false,
	"flag_train": false,
	"flag_cuda": true,
	"flag_mft": true,
	"flag_adv": false,
	"xy_keys_predict": [
	"original_text",
	"correct_text",
	"wrong_ids"
	],
	"keys": [
	"original_text",
	"correct_text",
	"wrong_ids"
	],
	"save_best_mertics_key": [
	"sentence",
	"strict_cor_f1"
	],
	"label_sep": "|myz|",
	"multi_label_threshold": 0.5,
	"len_rate": 1,
	"adv_emb_name": "word_embeddings.",
	"adv_eps": 1.0,
	"additional_special_tokens": [],
	"len_corpus": null,
	"prior_count": null,
	"prior": null,
	"l2i": null,
	"i2l": null,
	"xy_keys": [
	"original_text",
	"correct_text",
	"wrong_ids"
	]
	}