keveman committed on
Commit
0986ffe
·
verified ·
1 Parent(s): 9792ebd

Upload config.json

Browse files
Files changed (1) hide show
  1. config.json +54 -57
config.json CHANGED
@@ -1,74 +1,71 @@
1
  {
2
- "adapter_block_size": 4,
3
- "adapter_dropout": 0.1,
4
- "adapter_max_positions": 4096,
5
- "architectures": [
6
- "MoonshineStreamingForConditionalGeneration"
7
- ],
8
  "attention_bias": false,
9
- "attn_backend": "auto",
10
- "attn_dropout": 0.0,
11
  "bos_token_id": 1,
12
- "decoder_dim": 320,
13
- "decoder_num_attention_heads": 8,
14
- "decoder_num_hidden_layers": 6,
15
- "decoder_rotary_dim": 32,
16
  "decoder_start_token_id": 1,
17
- "dtype": "float32",
18
- "encoder_dim": 320,
19
- "encoder_num_attention_heads": 8,
20
- "encoder_num_hidden_layers": 6,
21
- "encoder_rotary_dim": 0,
22
- "encoder_window": [
23
- [
24
- 16,
25
- 4
26
- ],
27
- [
28
- 16,
29
- 4
30
- ],
31
- [
32
- 16,
33
- 0
34
- ],
35
- [
36
- 16,
37
- 0
38
- ],
39
- [
40
- 16,
41
- 4
42
- ],
43
- [
44
- 16,
45
- 4
 
 
 
 
 
 
 
 
 
 
46
  ]
47
- ],
 
48
  "eos_token_id": 2,
49
- "ff_dropout": 0.1,
50
  "ffn_mult": 4,
51
- "frame_ms": 5.0,
52
  "head_dim": 40,
 
 
 
53
  "is_encoder_decoder": true,
 
54
  "model_type": "moonshine_streaming",
 
 
55
  "num_key_value_heads": 8,
56
- "num_tokens_per_sec": 6.5,
57
  "pad_head_dim_to_multiple_of": null,
58
  "pad_token_id": 0,
59
- "preprocessor_asinh_k_init": 0.75,
60
- "preprocessor_c1": 640,
61
- "preprocessor_c2": 320,
62
- "preprocessor_input_dropout_p": 0.1,
63
- "preprocessor_input_dropout_sigma": 0.3,
64
- "preprocessor_k1": 5,
65
- "preprocessor_k2": 5,
66
- "rotary_base": 10000.0,
67
- "rotary_interpolation_factor": 1.0,
68
- "sample_rate": 16000,
69
  "transformers_version": "5.0.0.dev0",
70
  "use_cache": true,
71
- "use_swiglu_decoder": true,
72
- "use_swiglu_encoder": false,
73
  "vocab_size": 32768
74
  }
 
1
  {
 
 
 
 
 
 
2
  "attention_bias": false,
3
+ "attention_dropout": 0.0,
 
4
  "bos_token_id": 1,
 
 
 
 
5
  "decoder_start_token_id": 1,
6
+ "encoder_config": {
7
+ "attention_bias": false,
8
+ "attention_dropout": 0.0,
9
+ "frame_ms": 5.0,
10
+ "head_dim": 40,
11
+ "hidden_act": "gelu",
12
+ "hidden_size": 320,
13
+ "intermediate_size": 1280,
14
+ "max_position_embeddings": 4096,
15
+ "model_type": "moonshine_streaming_encoder",
16
+ "num_attention_heads": 8,
17
+ "num_hidden_layers": 6,
18
+ "num_key_value_heads": 8,
19
+ "sample_rate": 16000,
20
+ "sliding_windows": [
21
+ [
22
+ 16,
23
+ 4
24
+ ],
25
+ [
26
+ 16,
27
+ 4
28
+ ],
29
+ [
30
+ 16,
31
+ 0
32
+ ],
33
+ [
34
+ 16,
35
+ 0
36
+ ],
37
+ [
38
+ 16,
39
+ 4
40
+ ],
41
+ [
42
+ 16,
43
+ 4
44
+ ]
45
  ]
46
+ },
47
+ "encoder_hidden_size": 320,
48
  "eos_token_id": 2,
 
49
  "ffn_mult": 4,
 
50
  "head_dim": 40,
51
+ "hidden_act": "silu",
52
+ "hidden_size": 320,
53
+ "intermediate_size": 1280,
54
  "is_encoder_decoder": true,
55
+ "max_position_embeddings": 4096,
56
  "model_type": "moonshine_streaming",
57
+ "num_attention_heads": 8,
58
+ "num_hidden_layers": 6,
59
  "num_key_value_heads": 8,
 
60
  "pad_head_dim_to_multiple_of": null,
61
  "pad_token_id": 0,
62
+ "rope_parameters": {
63
+ "partial_rotary_factor": 0.8,
64
+ "rope_theta": 10000.0,
65
+ "rope_type": "default"
66
+ },
67
+ "tie_word_embeddings": false,
 
 
 
 
68
  "transformers_version": "5.0.0.dev0",
69
  "use_cache": true,
 
 
70
  "vocab_size": 32768
71
  }