{
  "batch_size": 32,
  "data_path": "train/en-zh_cn_vad_mix.csv",
  "dtype": "fp16",
  "encoding": "utf-8",
  "epochs": 4,
  "errors": "ignore",
  "eval_batch_size": 0,
  "eval_batches": 200,
  "eval_every": 100,
  "eval_ratio": 0.01,
  "grad_accum_steps": 4,
  "huber_delta": 1.0,
  "learning_rate": 1e-05,
  "log_every": 1,
  "loss": "huber",
  "max_length": 512,
  "max_rows": null,
  "max_steps": 5000,
  "min_chars": 2,
  "model_name": "hfl/chinese-macbert-base",
  "num_labels": 3,
  "num_rows": 400000,
  "output_dir": "train/vad-macbert-mix",
  "resume_from": "train/vad-macbert-long/best",
  "save_every": 100,
  "seed": 42,
  "shuffle_buffer": 4096,
  "warmup_ratio": 0.1,
  "warmup_steps": 0,
  "weight_decay": 0.01
}