deepseek-v3-mini / model_metadata.json
Mostafa8Mehrabi's picture
Upload COMPLETE FIXED DeepSeek-V3 Mini - All issues resolved (~181M parameters, no warnings)
25d5f86 verified
{
"tied_weights": [],
"tie_word_embeddings": true,
"original_param_count": 181320192,
"weights_properly_tied": true,
"embedding_params": 38597376,
"model_type": "deepseek_v3_mini",
"attention_mask_fixed": true,
"pad_token_id": 50255,
"eos_token_id": 50256,
"pad_token_different_from_eos": true
}