{
    "lora_name": "jql_llama_13b",
    "always_override": true,
    "save_steps": 0.0,
    "micro_batch_size": 8,
    "batch_size": 128,
    "epochs": 1.0,
    "learning_rate": "3e-4",
    "lr_scheduler_type": "linear",
    "lora_rank": 32,
    "lora_alpha": 64,
    "lora_dropout": 0.05,
    "cutoff_len": 256,
    "dataset": "jql_chat_gpt_v2",
    "eval_dataset": "None",
    "format": "jql-format",
    "eval_steps": 100.0,
    "raw_text_file": "None",
    "overlap_len": 128,
    "newline_favor_len": 128,
    "higher_rank_limit": false,
    "warmup_steps": 100.0,
    "optimizer": "adamw_torch",
    "hard_cut_string": "\\n\\n\\n",
    "train_only_after": ""
}
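For readers who want to reproduce this run outside the training UI, here is a minimal sketch of how these parameters could map onto Hugging Face PEFT and `transformers`. The base model name, dataset loading, and `Trainer` wiring are assumptions (the config itself only names the adapter `jql_llama_13b` and the dataset `jql_chat_gpt_v2`); note that `batch_size` 128 with `micro_batch_size` 8 implies 16 gradient-accumulation steps.

```python
# Sketch only: maps the JSON fields above onto PEFT/transformers equivalents.
# MODEL_NAME is an assumption based on the adapter name "jql_llama_13b".
from peft import LoraConfig, get_peft_model
from transformers import AutoModelForCausalLM, AutoTokenizer, TrainingArguments

MODEL_NAME = "meta-llama/Llama-2-13b-hf"  # assumed 13B Llama base

tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
model = AutoModelForCausalLM.from_pretrained(MODEL_NAME)

# lora_rank / lora_alpha / lora_dropout from the config above
lora_config = LoraConfig(
    r=32,
    lora_alpha=64,
    lora_dropout=0.05,
    task_type="CAUSAL_LM",
)
model = get_peft_model(model, lora_config)

# micro_batch_size is the per-device batch; batch_size / micro_batch_size
# gives the accumulation steps needed to reach the effective batch of 128.
training_args = TrainingArguments(
    output_dir="jql_llama_13b",
    per_device_train_batch_size=8,
    gradient_accumulation_steps=128 // 8,  # = 16
    num_train_epochs=1.0,
    learning_rate=3e-4,          # the JSON stores this as the string "3e-4"
    lr_scheduler_type="linear",
    warmup_steps=100,
    optim="adamw_torch",
)
```

Fields like `cutoff_len`, `overlap_len`, `newline_favor_len`, and `hard_cut_string` govern how the UI chunks and tokenizes the training text, so they have no direct `TrainingArguments` equivalent; they would belong in the dataset-preprocessing step instead.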