Upload 10 files
Browse files
onnx converted model for finetuned distilbert NER
- config.json +2 -3
- onnx/model.onnx +3 -0
- onnx/model_fp16.onnx +3 -0
- onnx/model_q4.onnx +3 -0
- onnx/model_quantized.onnx +3 -0
- quantize_config.json +11 -0
config.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
{
|
| 2 |
-
"_name_or_path": "
|
| 3 |
"activation": "gelu",
|
| 4 |
"architectures": [
|
| 5 |
"DistilBertForTokenClassification"
|
|
@@ -41,7 +41,6 @@
|
|
| 41 |
"seq_classif_dropout": 0.2,
|
| 42 |
"sinusoidal_pos_embds": false,
|
| 43 |
"tie_weights_": true,
|
| 44 |
-
"
|
| 45 |
-
"transformers_version": "4.44.2",
|
| 46 |
"vocab_size": 28996
|
| 47 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"_name_or_path": "Mozilla/distilbert-NER-LoRA",
|
| 3 |
"activation": "gelu",
|
| 4 |
"architectures": [
|
| 5 |
"DistilBertForTokenClassification"
|
|
|
|
| 41 |
"seq_classif_dropout": 0.2,
|
| 42 |
"sinusoidal_pos_embds": false,
|
| 43 |
"tie_weights_": true,
|
| 44 |
+
"transformers_version": "4.43.4",
|
|
|
|
| 45 |
"vocab_size": 28996
|
| 46 |
}
|
onnx/model.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:626fe45d2038e3894b781599696af0376a2431346b492f71bbd351bac41ebe8c
|
| 3 |
+
size 260940064
|
onnx/model_fp16.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b1b6ca590bf7f28e82adc87df888fe1811a0022043de48ea92432508333d9ee1
|
| 3 |
+
size 130544330
|
onnx/model_q4.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:04e01cb093d6a8afba3b6d40c52943ce7c0082fdba87b6d00104d9e7a062a2d7
|
| 3 |
+
size 117594921
|
onnx/model_quantized.onnx
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9219cbe3e4c3bd072b22464dfeb57cf3dc1b583e5d61d5282d64cf49d9922db8
|
| 3 |
+
size 65788336
|
quantize_config.json
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"modes": [
|
| 3 |
+
"q4"
|
| 4 |
+
],
|
| 5 |
+
"per_channel": true,
|
| 6 |
+
"reduce_range": true,
|
| 7 |
+
"block_size": null,
|
| 8 |
+
"is_symmetric": true,
|
| 9 |
+
"accuracy_level": null,
|
| 10 |
+
"quant_type": 1
|
| 11 |
+
}
|