vad-macbert / training_args.json
Pectics's picture
Initial commit
16cbc1c
raw
history blame contribute delete
729 Bytes
{
"batch_size": 32,
"data_path": "train/en-zh_cn_vad_mix.csv",
"dtype": "fp16",
"encoding": "utf-8",
"epochs": 4,
"errors": "ignore",
"eval_batch_size": 0,
"eval_batches": 200,
"eval_every": 100,
"eval_ratio": 0.01,
"grad_accum_steps": 4,
"huber_delta": 1.0,
"learning_rate": 1e-05,
"log_every": 1,
"loss": "huber",
"max_length": 512,
"max_rows": null,
"max_steps": 5000,
"min_chars": 2,
"model_name": "hfl/chinese-macbert-base",
"num_labels": 3,
"num_rows": 400000,
"output_dir": "train/vad-macbert-mix",
"resume_from": "train/vad-macbert-long/best",
"save_every": 100,
"seed": 42,
"shuffle_buffer": 4096,
"warmup_ratio": 0.1,
"warmup_steps": 0,
"weight_decay": 0.01
}