{
  "lora_name": "wwpp",
  "always_override": true,
  "save_steps": 0.0,
  "micro_batch_size": 12,
  "batch_size": 768,
  "epochs": 4.0,
  "learning_rate": "2e-5",
  "lr_scheduler_type": "linear",
  "lora_rank": 64,
  "lora_alpha": 128,
  "lora_dropout": 0.05,
  "cutoff_len": 256,
  "dataset": "komt_squad",
  "eval_dataset": "None",
  "format": "alpaca-format",
  "eval_steps": 100.0,
  "raw_text_file": "None",
  "overlap_len": 128,
  "newline_favor_len": 128,
  "higher_rank_limit": false,
  "warmup_steps": 300.0,
  "optimizer": "adamw_torch",
  "hard_cut_string": "\\f",
  "train_only_after": "",
  "stop_at_loss": 0,
  "add_eos_token": true,
  "min_chars": null,
  "report_to": "tensorboard"
}