File size: 278 Bytes
dd0024e
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
{
  "base_model": "google/functiongemma-270m-it",
  "dataset": "metga97/arabic-tooluse-functiongemma-v1",
  "max_seq_len": 1024,
  "epochs": 15,
  "lr": 5e-05,
  "weight_decay": 0.05,
  "warmup_ratio": 0.03,
  "grad_accum": 8,
  "per_device_bs": 8,
  "dtype": "torch.bfloat16"
}