File size: 464 Bytes
d7de395 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 | {
"method": "drop_upcycling",
"drop_ratio": 0.66,
"num_experts_per_layer": 288,
"base_experts_from_ffn": 12,
"replication_factor": 24,
"total_experts": 8064,
"source_ffn_dim": 8960,
"target_expert_dim": 768,
"layers": 28,
"total_params": 28938036224,
"total_params_calculated": 28860965888,
"active_params_per_forward": 917464064,
"activation_ratio": 0.03170443415365876,
"expert_params": 3538944,
"total_expert_params": 28538044416
} |