Visual Question Answering
Transformers
Safetensors
Vietnamese
vision-encoder-decoder
image-text-to-text
# Load model directly
from transformers import AutoTokenizer, AutoModelForImageTextToText
tokenizer = AutoTokenizer.from_pretrained("TeeA/DONUT-ViChart")
model = AutoModelForImageTextToText.from_pretrained("TeeA/DONUT-ViChart")
Quick Links
# Use a pipeline as a high-level helper
from transformers import pipeline
pipe = pipeline("visual-question-answering", model="TeeA/DONUT-ViChart")