{
  "base_model": "google/functiongemma-270m-it",
  "dataset": "metga97/arabic-tooluse-functiongemma-v1",
  "max_seq_len": 1024,
  "epochs": 15,
  "lr": 5e-05,
  "weight_decay": 0.05,
  "warmup_ratio": 0.03,
  "grad_accum": 8,
  "per_device_bs": 8,
  "dtype": "torch.bfloat16"
}