sergiopaniego HF Staff committed on
Commit
345d1e1
·
verified ·
1 Parent(s): abace48

Upload NemotronHForCausalLM

Browse files
Files changed (3) hide show
  1. config.json +2 -2
  2. generation_config.json +5 -8
  3. model.safetensors +2 -2
config.json CHANGED
@@ -20,9 +20,9 @@
20
  "mamba",
21
  "attention"
22
  ],
23
- "mamba_head_dim": 8,
24
  "mamba_hidden_act": "silu",
25
- "mamba_num_heads": 4,
26
  "mamba_proj_bias": false,
27
  "mamba_ssm_cache_dtype": "float32",
28
  "max_position_embeddings": 4096,
 
20
  "mamba",
21
  "attention"
22
  ],
23
+ "mamba_head_dim": 4,
24
  "mamba_hidden_act": "silu",
25
+ "mamba_num_heads": 8,
26
  "mamba_proj_bias": false,
27
  "mamba_ssm_cache_dtype": "float32",
28
  "max_position_embeddings": 4096,
generation_config.json CHANGED
@@ -1,13 +1,10 @@
1
  {
2
  "_from_model_config": true,
3
  "bos_token_id": 1,
4
- "do_sample": true,
5
- "eos_token_id": [
6
- 2,
7
- 11
8
- ],
9
  "pad_token_id": 0,
10
- "temperature": 1.0,
11
- "top_p": 1.0,
12
- "transformers_version": "5.3.0"
13
  }
 
1
  {
2
  "_from_model_config": true,
3
  "bos_token_id": 1,
4
+ "eos_token_id": 2,
5
+ "output_attentions": false,
6
+ "output_hidden_states": false,
 
 
7
  "pad_token_id": 0,
8
+ "transformers_version": "5.3.0",
9
+ "use_cache": true
 
10
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52e48197fa8403975baa3f2426192973fbc4859097b09a8c849eaa92f23e655c
3
- size 8444544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bf96d4f8045845e33623404b8d894cc9e6f8df654c74f077cdd0c14cdeeb438
3
+ size 8444696