Fasih-2B / config.json
HeshamHaroon's picture
Update config.json - SFT step 187
af592be verified
{
"model_type": "fasih",
"architectures": [
"GPT"
],
"sequence_len": 2048,
"vocab_size": 65536,
"n_layer": 24,
"n_head": 12,
"n_kv_head": 12,
"n_embd": 1536,
"window_pattern": "SSSL",
"framework": "nanochat",
"training": {
"stage": "sft",
"sft_step": 187,
"pretrain_steps": 15000,
"pretrain_tokens": "15.7B",
"sft_dataset": "InstAr-500k",
"val_bpb": 0.351,
"benchmarks": {
"ArabicMMLU": "31.95%",
"ACVA": "57.62%"
}
}
}