{ "batch_size": 32, "data_path": "train/en-zh_cn_vad_mix.csv", "dtype": "fp16", "encoding": "utf-8", "epochs": 4, "errors": "ignore", "eval_batch_size": 0, "eval_batches": 200, "eval_every": 100, "eval_ratio": 0.01, "grad_accum_steps": 4, "huber_delta": 1.0, "learning_rate": 1e-05, "log_every": 1, "loss": "huber", "max_length": 512, "max_rows": null, "max_steps": 5000, "min_chars": 2, "model_name": "hfl/chinese-macbert-base", "num_labels": 3, "num_rows": 400000, "output_dir": "train/vad-macbert-mix", "resume_from": "train/vad-macbert-long/best", "save_every": 100, "seed": 42, "shuffle_buffer": 4096, "warmup_ratio": 0.1, "warmup_steps": 0, "weight_decay": 0.01 }