Adding ONNX file of this model
Browse files
Beep boop, I am the [ONNX export bot 🤖🏎️](https://huggingface.co/spaces/onnx/export). On behalf of [halwarsing](https://huggingface.co/halwarsing), I would like to add to this repository the model converted to ONNX.
What is ONNX? It stands for "Open Neural Network Exchange", and is the most commonly used open standard for machine learning interoperability. You can find out more at [onnx.ai](https://onnx.ai/)!
The exported ONNX model can then be consumed by various backends such as TensorRT or TVM, or simply be used in a few lines with 🤗 Optimum through ONNX Runtime; check out how [here](https://huggingface.co/docs/optimum/main/en/onnxruntime/usage_guides/models)!
- .gitattributes +1 -0
- README.md +1 -1
- onnx/config.json +82 -0
- onnx/generation_config.json +7 -0
- onnx/merges.txt +0 -0
- onnx/model.onnx +3 -0
- onnx/model.onnx_data +3 -0
- onnx/special_tokens_map.json +30 -0
- onnx/tokenizer.json +0 -0
- onnx/tokenizer_config.json +22 -0
- onnx/vocab.json +0 -0
.gitattributes
CHANGED
|
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 32 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 33 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 32 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 33 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 35 |
+
onnx/model.onnx_data filter=lfs diff=lfs merge=lfs -text
|
README.md
CHANGED
|
@@ -2,10 +2,10 @@
|
|
| 2 |
license: creativeml-openrail-m
|
| 3 |
language:
|
| 4 |
- en
|
| 5 |
-
thumbnail:
|
| 6 |
tags:
|
| 7 |
- text generation
|
| 8 |
- conversational
|
|
|
|
| 9 |
inference: false
|
| 10 |
---
|
| 11 |
|
|
|
|
| 2 |
license: creativeml-openrail-m
|
| 3 |
language:
|
| 4 |
- en
|
|
|
|
| 5 |
tags:
|
| 6 |
- text generation
|
| 7 |
- conversational
|
| 8 |
+
- onnx
|
| 9 |
inference: false
|
| 10 |
---
|
| 11 |
|
onnx/config.json
ADDED
|
@@ -0,0 +1,82 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_attn_implementation_autoset": true,
|
| 3 |
+
"activation_function": "gelu_new",
|
| 4 |
+
"architectures": [
|
| 5 |
+
"GPTNeoForCausalLM"
|
| 6 |
+
],
|
| 7 |
+
"attention_dropout": 0,
|
| 8 |
+
"attention_layers": [
|
| 9 |
+
"global",
|
| 10 |
+
"local",
|
| 11 |
+
"global",
|
| 12 |
+
"local",
|
| 13 |
+
"global",
|
| 14 |
+
"local",
|
| 15 |
+
"global",
|
| 16 |
+
"local",
|
| 17 |
+
"global",
|
| 18 |
+
"local",
|
| 19 |
+
"global",
|
| 20 |
+
"local",
|
| 21 |
+
"global",
|
| 22 |
+
"local",
|
| 23 |
+
"global",
|
| 24 |
+
"local",
|
| 25 |
+
"global",
|
| 26 |
+
"local",
|
| 27 |
+
"global",
|
| 28 |
+
"local",
|
| 29 |
+
"global",
|
| 30 |
+
"local",
|
| 31 |
+
"global",
|
| 32 |
+
"local",
|
| 33 |
+
"global",
|
| 34 |
+
"local",
|
| 35 |
+
"global",
|
| 36 |
+
"local",
|
| 37 |
+
"global",
|
| 38 |
+
"local",
|
| 39 |
+
"global",
|
| 40 |
+
"local"
|
| 41 |
+
],
|
| 42 |
+
"attention_types": [
|
| 43 |
+
[
|
| 44 |
+
[
|
| 45 |
+
"global",
|
| 46 |
+
"local"
|
| 47 |
+
],
|
| 48 |
+
16
|
| 49 |
+
]
|
| 50 |
+
],
|
| 51 |
+
"bos_token_id": 50256,
|
| 52 |
+
"classifier_dropout": 0.1,
|
| 53 |
+
"embed_dropout": 0,
|
| 54 |
+
"eos_token_id": 50256,
|
| 55 |
+
"hidden_size": 2560,
|
| 56 |
+
"initializer_range": 0.02,
|
| 57 |
+
"intermediate_size": null,
|
| 58 |
+
"layer_norm_epsilon": 1e-05,
|
| 59 |
+
"max_position_embeddings": 2048,
|
| 60 |
+
"model_type": "gpt_neo",
|
| 61 |
+
"num_heads": 20,
|
| 62 |
+
"num_layers": 32,
|
| 63 |
+
"resid_dropout": 0,
|
| 64 |
+
"summary_activation": null,
|
| 65 |
+
"summary_first_dropout": 0.1,
|
| 66 |
+
"summary_proj_to_labels": true,
|
| 67 |
+
"summary_type": "cls_index",
|
| 68 |
+
"summary_use_proj": true,
|
| 69 |
+
"task_specific_params": {
|
| 70 |
+
"text-generation": {
|
| 71 |
+
"do_sample": true,
|
| 72 |
+
"max_length": 50,
|
| 73 |
+
"temperature": 0.9
|
| 74 |
+
}
|
| 75 |
+
},
|
| 76 |
+
"tokenizer_class": "GPT2Tokenizer",
|
| 77 |
+
"torch_dtype": "float32",
|
| 78 |
+
"transformers_version": "4.51.3",
|
| 79 |
+
"use_cache": false,
|
| 80 |
+
"vocab_size": 50257,
|
| 81 |
+
"window_size": 256
|
| 82 |
+
}
|
onnx/generation_config.json
ADDED
|
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_from_model_config": true,
|
| 3 |
+
"bos_token_id": 50256,
|
| 4 |
+
"eos_token_id": 50256,
|
| 5 |
+
"transformers_version": "4.51.3",
|
| 6 |
+
"use_cache": false
|
| 7 |
+
}
|
onnx/merges.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
onnx/model.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ea5b9d896048ad6391ed2a83a7dff34fbfc2732683552ab6014ace8a1765a6c9
|
| 3 |
+
size 979496
|
onnx/model.onnx_data
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:afd1623bbda9d723b7d405a3f03f196f0a231c1789dca0eef88169b91a4b1edb
|
| 3 |
+
size 11128250368
|
onnx/special_tokens_map.json
ADDED
|
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token": {
|
| 3 |
+
"content": "<|endoftext|>",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"eos_token": {
|
| 10 |
+
"content": "<|endoftext|>",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"pad_token": {
|
| 17 |
+
"content": "<|endoftext|>",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"unk_token": {
|
| 24 |
+
"content": "<|endoftext|>",
|
| 25 |
+
"lstrip": false,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
}
|
| 30 |
+
}
|
onnx/tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
onnx/tokenizer_config.json
ADDED
|
@@ -0,0 +1,22 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_prefix_space": false,
|
| 3 |
+
"added_tokens_decoder": {
|
| 4 |
+
"50256": {
|
| 5 |
+
"content": "<|endoftext|>",
|
| 6 |
+
"lstrip": false,
|
| 7 |
+
"normalized": false,
|
| 8 |
+
"rstrip": false,
|
| 9 |
+
"single_word": false,
|
| 10 |
+
"special": true
|
| 11 |
+
}
|
| 12 |
+
},
|
| 13 |
+
"bos_token": "<|endoftext|>",
|
| 14 |
+
"clean_up_tokenization_spaces": false,
|
| 15 |
+
"eos_token": "<|endoftext|>",
|
| 16 |
+
"errors": "replace",
|
| 17 |
+
"extra_special_tokens": {},
|
| 18 |
+
"model_max_length": 2048,
|
| 19 |
+
"pad_token": "<|endoftext|>",
|
| 20 |
+
"tokenizer_class": "GPT2Tokenizer",
|
| 21 |
+
"unk_token": "<|endoftext|>"
|
| 22 |
+
}
|
onnx/vocab.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|