# pose-like / src/generate_caption.py
# Last commit b857d30 (verified), uploaded by huggysynuo:
#   "Update src/generate_caption.py"
from transformers import BlipProcessor, BlipForConditionalGeneration
from PIL import Image
import torch
import os
import streamlit as st
import tempfile
# Keep the Hugging Face cache in a directory under the system temp dir and
# make sure it exists before anything is downloaded into it.
HF_CACHE_DIR = os.path.join(tempfile.gettempdir(), "hf_cache")
os.makedirs(HF_CACHE_DIR, exist_ok=True)

# Only HF_HOME is exported; no other cache-related variable is touched.
# NOTE(review): this assignment runs after `transformers` has been imported,
# so code that reads HF_HOME at import time may not see it — the explicit
# `cache_dir` arguments below are what pin the download location. Confirm.
os.environ["HF_HOME"] = HF_CACHE_DIR

# Checkpoint shared by the processor and the captioning model.
_BLIP_CHECKPOINT = "Salesforce/blip-image-captioning-base"

# Both objects are loaded once at import time, with the cache directory
# passed explicitly to each loader.
processor = BlipProcessor.from_pretrained(
    _BLIP_CHECKPOINT,
    cache_dir=HF_CACHE_DIR,
)
model = BlipForConditionalGeneration.from_pretrained(
    _BLIP_CHECKPOINT,
    cache_dir=HF_CACHE_DIR,
)
def generate_caption(image_path):
    """Generate a text caption for an image using the BLIP model.

    The module-level ``processor`` and ``model`` (loaded once at import time)
    are used directly; nothing is reloaded per call.

    Args:
        image_path: Location of the image, passed as-is to ``PIL.Image.open``.

    Returns:
        The decoded caption for the first generated sequence, with special
        tokens stripped.

    Raises:
        Whatever ``PIL.Image.open`` raises when the image cannot be opened.
    """
    # Open inside a context manager so the file handle is released as soon as
    # the RGB copy has been made; ``convert`` returns an independent image.
    with Image.open(image_path) as raw_image:
        image = raw_image.convert("RGB")

    inputs = processor(image, return_tensors="pt")

    # Inference only: gradients are not needed, so skip tracking them.
    with torch.no_grad():
        out = model.generate(**inputs)

    return processor.decode(out[0], skip_special_tokens=True)