nvidia/Minitron-8B-Base

@@ -13,7 +13,7 @@
   "model_type": "nemotron",
   "num_attention_heads": 48,
   "num_hidden_layers": 32,
-  "kv_channels": 128,
   "num_key_value_heads": 8,
   "norm_eps": 1e-05,
   "rope_theta": 10000,

   "model_type": "nemotron",
   "num_attention_heads": 48,
   "num_hidden_layers": 32,
+  "head_dim": 128,
   "num_key_value_heads": 8,
   "norm_eps": 1e-05,
   "rope_theta": 10000,