# Load model directly
from transformers import AutoTokenizer, AutoModelForImageTextToText
# Single source of truth for the checkpoint id, so the tokenizer and the model
# are always loaded from the same repository.
MODEL_ID = "fxmarty/tiny-doc-qa-vision-encoder-decoder"

# Load the tokenizer and the model from the same checkpoint.
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
model = AutoModelForImageTextToText.from_pretrained(MODEL_ID)
# Alternatively, use a pipeline as a high-level helper:
# from transformers import pipeline
# pipe = pipeline("document-question-answering", model="fxmarty/tiny-doc-qa-vision-encoder-decoder")