{
  "output_dir": "../drive/MyDrive/NICE/model/0430_train_less",
  "model_name_or_path": "../drive/MyDrive/NICE/model/cap_best/OFA-huge-caption",
  "train_caption_file": "./data/train_caption_catAdded.jsonl",
  "train_image_file": "../drive/MyDrive/NICE/train_image.tsv",
  "test_caption_file": null,
  "test_image_file": null,
  "freeze_encoder": false,
  "freeze_word_embed": false,
  "num_train_epochs": 20,
  "max_steps": -1,
  "per_device_train_batch_size": 12,
  "per_device_eval_batch_size": 256,
  "learning_rate": 5e-05,
  "max_seq_length": 150,
  "logging_steps": 500,
  "save_steps": 5000,
  "save_total_limit": 1,
  "lr_scheduler_type": "cosine",
  "warmup_steps": 400,
  "warmup_ratio": 0,
  "gradient_accumulation_steps": 1,
  "optim": "adamw_torch",
  "seed": 69,
  "fp16": false,
  "no_cuda": false,
  "dataloader_num_workers": 8,
  "save_strategy": "steps",
  "weight_decay": 0.01,
  "max_grad_norm": 1.0,
  "remove_unused_columns": false
}