Update src/models/imageCaptioning.py
src/models/imageCaptioning.py  CHANGED  (+34 -17)
@@ -1,24 +1,41 @@

-import requests
-import base64
-import os
+# import requests
+# import base64
+# import os


-hf_token = os.environ.get("HUGGINGFACE_API_TOKEN")
+# hf_token = os.environ.get("HUGGINGFACE_API_TOKEN")

-API_URL = "https://api-inference.huggingface.co/models/nlpconnect/vit-gpt2-image-captioning"
-headers = {
-    "Authorization": f"Bearer {hf_token}"
-}
+# API_URL = "https://api-inference.huggingface.co/models/nlpconnect/vit-gpt2-image-captioning"
+# headers = {
+#     "Authorization": f"Bearer {hf_token}"
+# }

-def generateCaption(image_path):
-    with open(image_path, "rb") as image_file:
-        image_bytes = image_file.read()
+# def generateCaption(image_path):
+#     with open(image_path, "rb") as image_file:
+#         image_bytes = image_file.read()

-    response = requests.post(API_URL, headers=headers, files={"file": image_bytes})
+#     response = requests.post(API_URL, headers=headers, files={"file": image_bytes})

-    if response.status_code == 200:
-        result = response.json()
-        return result[0]['generated_text']
-    else:
-        return f"Error generating caption: {response.text}"
+#     if response.status_code == 200:
+#         result = response.json()
+#         return result[0]['generated_text']
+#     else:
+#         return f"Error generating caption: {response.text}"
+
+
+from PIL import Image
+from transformers import BlipProcessor, BlipForConditionalGeneration
+import torch
+
+
+processor = BlipProcessor.from_pretrained("./models/Caption")
+model = BlipForConditionalGeneration.from_pretrained("./models/Caption")
+
+
+def generateCaption(image_path):
+    image = Image.open(image_path).convert("RGB")
+    inputs = processor(images=image, return_tensors="pt")
+    output = model.generate(**inputs)
+    caption = processor.decode(output[0], skip_special_tokens=True)
+    return caption
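
The commit comments out the hosted Inference API path (and its HUGGINGFACE_API_TOKEN requirement) in favor of a BLIP checkpoint loaded from the local directory ./models/Caption. For the new code to run, that directory must already contain the processor and model files. Below is a minimal one-time setup sketch; the commit does not say which checkpoint was exported there, so Salesforce/blip-image-captioning-base is an assumption, and the image path in the usage lines is a placeholder.

# Hypothetical setup: download a BLIP captioning checkpoint once and save it
# where the module expects it. The checkpoint name is an assumption; swap in
# whichever one this Space actually uses.
from transformers import BlipProcessor, BlipForConditionalGeneration

checkpoint = "Salesforce/blip-image-captioning-base"  # assumed checkpoint
BlipProcessor.from_pretrained(checkpoint).save_pretrained("./models/Caption")
BlipForConditionalGeneration.from_pretrained(checkpoint).save_pretrained("./models/Caption")

# After that, captioning runs locally with no API token or network call:
from src.models.imageCaptioning import generateCaption
print(generateCaption("photo.jpg"))  # "photo.jpg" is a placeholder path

Note that the new module imports torch only as the backend for model.generate; it is never referenced directly. The trade-off versus the old version is a one-time model download and local compute instead of per-request network calls, which also removes the need for the HTTP error branch the old function carried.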