polieste
/

fastAbs_large

text2text-generation

text-generation-inference

Model card · Files and versions

polieste committed on Jan 8, 2024

Commit

61d393a

·

1 Parent(s): c3d4b5c

Update README.md

Files changed (1) hide show

README.md +3 -16

README.md CHANGED Viewed

@@ -8,7 +8,7 @@ tags:
 license: mit
 widget:
-- text: "vietnews: VietAI là tổ chức phi lợi nhuận với sứ mệnh ươm mầm tài năng về trí tuệ nhân tạo và xây dựng một cộng đồng các chuyên gia trong lĩnh vực trí tuệ nhân tạo đẳng cấp quốc tế tại Việt Nam."
 ---
 # ViT5-large Finetuned on `vietnews` Abstractive Summarization
@@ -28,29 +28,16 @@ tokenizer = AutoTokenizer.from_pretrained("VietAI/vit5-large-vietnews-summarizat
 model = AutoModelForSeq2SeqLM.from_pretrained("VietAI/vit5-large-vietnews-summarization")
 model.cuda()
-sentence = "VietAI là tổ chức phi lợi nhuận với sứ mệnh ươm mầm tài năng về trí tuệ nhân tạo và xây dựng một cộng đồng các chuyên gia trong lĩnh vực trí tuệ nhân tạo đẳng cấp quốc tế tại Việt Nam."
 text =  "vietnews: " + sentence + " </s>"
 encoding = tokenizer(text, return_tensors="pt")
 input_ids, attention_masks = encoding["input_ids"].to("cuda"), encoding["attention_mask"].to("cuda")
 outputs = model.generate(
     input_ids=input_ids, attention_mask=attention_masks,
-    max_length=256,
     early_stopping=True
 )
 for output in outputs:
     line = tokenizer.decode(output, skip_special_tokens=True, clean_up_tokenization_spaces=True)
     print(line)
 ```
-## Citation
-```
-@inproceedings{phan-etal-2022-vit5,
-    title = "{V}i{T}5: Pretrained Text-to-Text Transformer for {V}ietnamese Language Generation",
-    author = "Phan, Long and Tran, Hieu and Nguyen, Hieu and Trinh, Trieu H.",
-    booktitle = "Proceedings of the 2022 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies: Student Research Workshop",
-    year = "2022",
-    publisher = "Association for Computational Linguistics",
-    url = "https://aclanthology.org/2022.naacl-srw.18",
-    pages = "136--142",
-}
-```

 license: mit
 widget:
+- text: "Input text."
 ---
 # ViT5-large Finetuned on `vietnews` Abstractive Summarization
 model = AutoModelForSeq2SeqLM.from_pretrained("VietAI/vit5-large-vietnews-summarization")
 model.cuda()
+sentence = "Input text"
 text =  "vietnews: " + sentence + " </s>"
 encoding = tokenizer(text, return_tensors="pt")
 input_ids, attention_masks = encoding["input_ids"].to("cuda"), encoding["attention_mask"].to("cuda")
 outputs = model.generate(
     input_ids=input_ids, attention_mask=attention_masks,
+    max_length=128,
     early_stopping=True
 )
 for output in outputs:
     line = tokenizer.decode(output, skip_special_tokens=True, clean_up_tokenization_spaces=True)
     print(line)
 ```