{
  "lora_name": "falc7b_swift_contxt_230703_1",
  "always_override": true,
  "save_steps": 50.0,
  "micro_batch_size": 4,
  "batch_size": 32,
  "epochs": 1.0,
  "learning_rate": "1e-3",
  "lr_scheduler_type": "linear",
  "lora_rank": 64,
  "lora_alpha": 128,
  "lora_dropout": 0.05,
  "cutoff_len": 1024,
  "dataset": "None",
  "eval_dataset": "None",
  "format": "None",
  "eval_steps": 100.0,
  "raw_text_file": "swiftify_context_train",
  "overlap_len": 128,
  "newline_favor_len": 128,
  "higher_rank_limit": false,
  "warmup_steps": 30.0,
  "optimizer": "adamw_torch",
  "hard_cut_string": "\\n\\n\\n",
  "train_only_after": "",
  "stop_at_loss": 1.5
}