mt5_extend_py2500 / t5marulog.jsonl
Kajiura Teruno
Expanded vocabulary by adding 2,500 words
4c1c18a
raw
history blame
535 Bytes
{"log": "trained", "date": "2023-07-03T20:46:17", "elapsed": "00:07:50", "model": "Roy029/mt5_extend_2500_new", "max_length": 128, "target_max_length": 128, "batch_size": 16, "gradient_accumulation_steps": 1, "train_steps": 4084, "accelerator": "gpu", "devices": "auto", "precision": 32, "strategy": "auto", "gradient_clip_val": 1.0, "compile": true, "solver": "adamw", "lr": 0.0003, "warmup_steps": 1, "training_steps": 100000, "adam_epsilon": 1e-08, "weight_decay": 0.0, "epoch": 5, "step": 3675, "saved": "mt5_extend_2500_new_tra"}