HyperAccel committed on
Commit
84134db
·
verified ·
1 Parent(s): a16d03a

Upload tiny-random nemotron_h model

Browse files
Files changed (2) hide show
  1. config.json +2 -2
  2. model.safetensors +2 -2
config.json CHANGED
@@ -40,7 +40,7 @@
40
  "mlp_hidden_act": "relu2",
41
  "model_type": "nemotron_h",
42
  "moe_intermediate_size": 256,
43
- "moe_latent_size": null,
44
  "moe_shared_expert_intermediate_size": 512,
45
  "moe_shared_expert_overlap": true,
46
  "mtp_layers_block_type": [
@@ -57,7 +57,7 @@
57
  "num_experts_per_tok": 2,
58
  "num_key_value_heads": 2,
59
  "num_logits_to_keep": 1,
60
- "num_nextn_predict_layers": 0,
61
  "pad_token_id": 0,
62
  "partial_rotary_factor": 1.0,
63
  "prefix": null,
 
40
  "mlp_hidden_act": "relu2",
41
  "model_type": "nemotron_h",
42
  "moe_intermediate_size": 256,
43
+ "moe_latent_size": 256,
44
  "moe_shared_expert_intermediate_size": 512,
45
  "moe_shared_expert_overlap": true,
46
  "mtp_layers_block_type": [
 
57
  "num_experts_per_tok": 2,
58
  "num_key_value_heads": 2,
59
  "num_logits_to_keep": 1,
60
+ "num_nextn_predict_layers": 1,
61
  "pad_token_id": 0,
62
  "partial_rotary_factor": 1.0,
63
  "prefix": null,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ec18d6b76cdf5babb27b2d46b619217600f08a5c52781a4542ca054a6a95d11
3
- size 287199248
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0473059033b81699665869718a074ce39ec4e1f2a4edeafc6f54348b41b2bf3
3
+ size 286151152