{
"model_type": "tinyv4",
"architectures": ["TinyV4"],
"auto_map": {
"AutoModel": "modeling_tinyv4.TinyV4",
"AutoModelForCausalLM": "modeling_tinyv4.TinyV4"
},
"vocab_size": 32000,
"dim": 128,
"depth": 6,
"n_hc": 2,
"n_routed": 4,
"n_active": 2,
"n_shared": 1,
"expert_intermediate": 192,
"csa_m": 4,
"csa_topk": 16,
"hca_m": 8,
"n_win": 16,
"n_q_head": 4,
"head_dim": 48,
"d_c": 64,
"n_idx_head": 4,
"idx_head_dim": 48,
"n_out_group": 2,
"d_g": 64,
"rope_dim": 24,
"mtp_depth": 1,
"hash_layers": 2,
"max_len": 512,
"sinkhorn_iters": 20,
"aux_bias_update": 0.001,
"bal_loss_weight": 0.0001,
"step": 5000,
"best_loss": 3.9723572731018066
}