echarlaix HF Staff committed on
Commit
33e9661
·
1 Parent(s): e233289

Set config.use_mem_rope to True

Browse files
config.json CHANGED
@@ -12,6 +12,7 @@
12
  "conv_kernel": 3,
13
  "d_model": 16,
14
  "d_state": 32,
 
15
  "eos_token_id": 2,
16
  "expand": 2,
17
  "hidden_act": "gelu",
@@ -44,18 +45,21 @@
44
  "num_query_groups": 32,
45
  "pad_token_id": 0,
46
  "rms_norm_eps": 1e-05,
47
- "rope_theta": 10000,
 
 
 
 
48
  "time_step_floor": 0.0001,
49
  "time_step_limit": null,
50
  "time_step_max": 0.1,
51
  "time_step_min": 0.001,
52
- "torch_dtype": "float32",
53
- "transformers_version": "4.55.4",
54
  "use_cache": true,
55
  "use_conv_bias": true,
56
  "use_long_context": false,
57
  "use_mem_eff_path": false,
58
- "use_mem_rope": false,
59
  "use_shared_attention_adapter": false,
60
  "vocab_size": 50280
61
  }
 
12
  "conv_kernel": 3,
13
  "d_model": 16,
14
  "d_state": 32,
15
+ "dtype": "float32",
16
  "eos_token_id": 2,
17
  "expand": 2,
18
  "hidden_act": "gelu",
 
45
  "num_query_groups": 32,
46
  "pad_token_id": 0,
47
  "rms_norm_eps": 1e-05,
48
+ "rope_parameters": {
49
+ "rope_theta": 10000,
50
+ "rope_type": "default"
51
+ },
52
+ "tie_word_embeddings": true,
53
  "time_step_floor": 0.0001,
54
  "time_step_limit": null,
55
  "time_step_max": 0.1,
56
  "time_step_min": 0.001,
57
+ "transformers_version": "5.0.0",
 
58
  "use_cache": true,
59
  "use_conv_bias": true,
60
  "use_long_context": false,
61
  "use_mem_eff_path": false,
62
+ "use_mem_rope": true,
63
  "use_shared_attention_adapter": false,
64
  "vocab_size": 50280
65
  }
generation_config.json CHANGED
@@ -3,5 +3,5 @@
3
  "bos_token_id": 1,
4
  "eos_token_id": 2,
5
  "pad_token_id": 0,
6
- "transformers_version": "4.55.4"
7
  }
 
3
  "bos_token_id": 1,
4
  "eos_token_id": 2,
5
  "pad_token_id": 0,
6
+ "transformers_version": "5.0.0"
7
  }
pytorch_model.bin → model.safetensors RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa28ee93e29e40c5fc35e5727122220d5dc937b65f27f71995c8edbb056e551c
3
- size 3408858
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:257244fe95a815ccdfc00b230826eb464c8b6bfc791d6e8c35ec7a0e470ae4fb
3
+ size 3398168