Upload bart-large-cnn ONNX model

Browse files

Files changed (7) hide show

README.md +48 -0
config.json +68 -0
decoder_model.onnx +3 -0
decoder_with_past_model.onnx +3 -0
encoder_model.onnx +3 -0
merges.txt +0 -0
vocab.json +0 -0

README.md ADDED Viewed

	@@ -0,0 +1,48 @@

+---
+library_name: onnx
+tags:
+  - text2text-generation
+  - bart
+  - summarization
+  - encoder-decoder
+  - onnx
+  - inference4j
+license: apache-2.0
+pipeline_tag: summarization
+---
+# BART Large CNN — ONNX
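+ONNX export of [BART Large CNN](https://huggingface.co/facebook/bart-large-cnn) (406M parameters), split into three graphs: `encoder_model.onnx`, `decoder_model.onnx` (first decoding step), and `decoder_with_past_model.onnx` (subsequent steps that reuse the KV cache).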
+Fine-tuned for text summarization on the CNN/DailyMail dataset.
+Converted for use with [inference4j](https://github.com/inference4j/inference4j), an inference-only AI library for Java.
+## Original Source
+- **Repository:** [facebook/bart-large-cnn](https://huggingface.co/facebook/bart-large-cnn)
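+- **License:** MIT according to the upstream model card (verify there before redistributing); this ONNX export is published under Apache 2.0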
+## Usage with inference4j
+```java
+try (var summarizer = BartSummarizer.bartLargeCnn().build()) {
+    System.out.println(summarizer.summarize("Long article text..."));
+}
+```
+## Model Details
+| Property | Value |
+|----------|-------|
+| Architecture | BART encoder-decoder (406M parameters, 12 encoder + 12 decoder layers) |
+| Task | Text summarization |
+| Training data | CNN/DailyMail |
+| Tokenizer | BPE (50,265-entry vocabulary; note that `vocab_size` in `config.json` is 50,264) |
+| Original framework | PyTorch (transformers) |
+| Export method | Hugging Face Optimum (encoder-decoder with KV cache) |
+## License
+This model is licensed under the [Apache License 2.0](https://www.apache.org/licenses/LICENSE-2.0). Original model by [Facebook AI](https://huggingface.co/facebook).

config.json ADDED Viewed

	@@ -0,0 +1,68 @@

+{
+  "_num_labels": 3,
+  "activation_dropout": 0.0,
+  "activation_function": "gelu",
+  "add_final_layer_norm": false,
+  "architectures": [
+    "BartForConditionalGeneration"
+  ],
+  "attention_dropout": 0.0,
+  "bos_token_id": 0,
+  "classif_dropout": 0.0,
+  "classifier_dropout": 0.0,
+  "d_model": 1024,
+  "decoder_attention_heads": 16,
+  "decoder_ffn_dim": 4096,
+  "decoder_layerdrop": 0.0,
+  "decoder_layers": 12,
+  "decoder_start_token_id": 2,
+  "dropout": 0.1,
+  "dtype": "float32",
+  "early_stopping": null,
+  "encoder_attention_heads": 16,
+  "encoder_ffn_dim": 4096,
+  "encoder_layerdrop": 0.0,
+  "encoder_layers": 12,
+  "eos_token_id": 2,
+  "force_bos_token_to_be_generated": true,
+  "forced_eos_token_id": 2,
+  "gradient_checkpointing": false,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2"
+  },
+  "init_std": 0.02,
+  "is_encoder_decoder": true,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_2": 2
+  },
+  "length_penalty": null,
+  "max_length": null,
+  "max_position_embeddings": 1024,
+  "min_length": null,
+  "model_type": "bart",
+  "no_repeat_ngram_size": null,
+  "normalize_before": false,
+  "num_beams": null,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 1,
+  "prefix": " ",
+  "scale_embedding": false,
+  "task_specific_params": {
+    "summarization": {
+      "early_stopping": true,
+      "length_penalty": 2.0,
+      "max_length": 142,
+      "min_length": 56,
+      "no_repeat_ngram_size": 3,
+      "num_beams": 4
+    }
+  },
+  "transformers_version": "4.57.6",
+  "use_cache": true,
+  "vocab_size": 50264
+}

decoder_model.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ee2f468f76c5cf971baa3c9c7643cdb68eae2b0cfafbca3d4a7521dfda3bd067
+size 1222805764

decoder_with_past_model.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bf83b21384c46139c445444747191169a04aa769e1b165004c73c04caac039e2
+size 1122000148

encoder_model.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9d4be719088e992b5f18e25a5b10800a6934ae0fc5c67cd5e236e1f4bca61204
+size 814868677

merges.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

vocab.json ADDED Viewed

The diff for this file is too large to render. See raw diff