Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -3,7 +3,7 @@ import os
|
|
| 3 |
import cv2
|
| 4 |
import pandas as pd
|
| 5 |
from PIL import Image
|
| 6 |
- from transformers import VisionEncoderDecoderModel,
|
| 7 |
import nltk
|
| 8 |
import tempfile
|
| 9 |
import zipfile
|
|
@@ -14,7 +14,7 @@ nltk.download('omw-1.4')
|
|
| 14 |
# Load the pre-trained models for image captioning and summarization
|
| 15 |
model_name = "NourFakih/Vit-GPT2-COCO2017Flickr-85k-09"
|
| 16 |
model = VisionEncoderDecoderModel.from_pretrained(model_name)
|
| 17 |
- feature_extractor =
|
| 18 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
| 19 |
|
| 20 |
model_sum_name = "google-t5/t5-base"
|
|
|
|
| 3 |
import cv2
|
| 4 |
import pandas as pd
|
| 5 |
from PIL import Image
|
| 6 |
+ from transformers import VisionEncoderDecoderModel, ViTImageProcessor, AutoTokenizer, pipeline, AutoModelForSeq2SeqLM
|
| 7 |
import nltk
|
| 8 |
import tempfile
|
| 9 |
import zipfile
|
|
|
|
| 14 |
# Load the pre-trained models for image captioning and summarization
|
| 15 |
model_name = "NourFakih/Vit-GPT2-COCO2017Flickr-85k-09"
|
| 16 |
model = VisionEncoderDecoderModel.from_pretrained(model_name)
|
| 17 |
+ feature_extractor = ViTImageProcessor.from_pretrained(model_name)
|
| 18 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
| 19 |
|
| 20 |
model_sum_name = "google-t5/t5-base"
|