{
  "base_model": "Qwen/Qwen3-8B",
  "dtype": "bfloat16",
  "lora": {
    "r": 16,
    "alpha": 32,
    "dropout": 0.05,
    "targets": [
      "q_proj",
      "k_proj",
      "v_proj",
      "o_proj"
    ]
  },
  "max_seq_length": 384
}
{
  "base_model": "Qwen/Qwen3-8B",
  "dtype": "bfloat16",
  "lora": {
    "r": 16,
    "alpha": 32,
    "dropout": 0.05,
    "targets": [
      "q_proj",
      "k_proj",
      "v_proj",
      "o_proj"
    ]
  },
  "max_seq_length": 384
}