tehkehyong committed on
Commit
4c4c6dd
·
verified ·
1 Parent(s): 7a73d8d

Adding ONNX file of this model

Browse files

Beep boop I am the [ONNX export bot 🤖🏎️](https://huggingface.co/spaces/onnx/export). On behalf of [tehkehyong](https://huggingface.co/tehkehyong), I would like to add to this repository the model converted to ONNX.

What is ONNX? It stands for "Open Neural Network Exchange", and is the most commonly used open standard for machine learning interoperability. You can find out more at [onnx.ai](https://onnx.ai/)!

The exported ONNX model can then be consumed by various backends such as TensorRT or TVM, or simply be used in a few lines with 🤗 Optimum through ONNX Runtime. Check out how [here](https://huggingface.co/docs/optimum/main/en/onnxruntime/usage_guides/models)!

README.md CHANGED
@@ -5,6 +5,8 @@ language:
5
  library_name: transformers
6
  pipeline_tag: automatic-speech-recognition
7
  arxiv: https://arxiv.org/abs/2410.15608
 
 
8
  ---
9
  # Moonshine
10
 
 
5
  library_name: transformers
6
  pipeline_tag: automatic-speech-recognition
7
  arxiv: https://arxiv.org/abs/2410.15608
8
+ tags:
9
+ - onnx
10
  ---
11
  # Moonshine
12
 
onnx/config.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_attn_implementation_autoset": true,
3
+ "architectures": [
4
+ "MoonshineForConditionalGeneration"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 1,
9
+ "decoder_hidden_act": "silu",
10
+ "decoder_num_attention_heads": 8,
11
+ "decoder_num_hidden_layers": 8,
12
+ "decoder_num_key_value_heads": 8,
13
+ "decoder_start_token_id": 1,
14
+ "encoder_hidden_act": "gelu",
15
+ "encoder_num_attention_heads": 8,
16
+ "encoder_num_hidden_layers": 8,
17
+ "encoder_num_key_value_heads": 8,
18
+ "eos_token_id": 2,
19
+ "hidden_size": 416,
20
+ "initializer_range": 0.02,
21
+ "intermediate_size": 1664,
22
+ "is_encoder_decoder": true,
23
+ "max_position_embeddings": 194,
24
+ "model_type": "moonshine",
25
+ "pad_head_dim_to_multiple_of": 8,
26
+ "pad_token_id": 2,
27
+ "partial_rotary_factor": 0.62,
28
+ "rope_scaling": null,
29
+ "rope_theta": 10000.0,
30
+ "torch_dtype": "float32",
31
+ "transformers_version": "4.51.3",
32
+ "use_cache": true,
33
+ "vocab_size": 32768
34
+ }
onnx/decoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:787a50bff53d5e27c7ca33156d4c50275a5189203dd136b0bdcd76e90252b452
3
+ size 220550817
onnx/decoder_model_merged.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2843a351768822b22011efdde830033c6144620f7ce991b17376db6306cd69fc
3
+ size 221115751
onnx/decoder_with_past_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:feeadf4f0ec021cdebf953cab5b251fd8856889ed9180c30d083f6f150b1bebb
3
+ size 209453359
onnx/encoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85ff09b3d810666d37d98a3dccc1025ee4722ea1a556b5b1d1bdd85b5f583a5f
3
+ size 80900411
onnx/generation_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "decoder_start_token_id": 1,
5
+ "eos_token_id": 2,
6
+ "max_length": 194,
7
+ "pad_token_id": 2,
8
+ "transformers_version": "4.51.3"
9
+ }
onnx/preprocessor_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": false,
3
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
4
+ "feature_size": 1,
5
+ "padding_side": "right",
6
+ "padding_value": 0.0,
7
+ "return_attention_mask": true,
8
+ "sampling_rate": 16000
9
+ }
onnx/special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {}
onnx/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
onnx/tokenizer_config.json ADDED
The diff for this file is too large to render. See raw diff