Spaces:

Kazel
/

collarvision

Paused

Kazel committed on Mar 31, 2025

Commit

5b84e6f

verified ·

1 Parent(s): 5fd9575

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -4,6 +4,7 @@ import threading
 import torch
 from transformers import BlipProcessor, BlipForConditionalGeneration
 from PIL import Image
 # Initialize the webcam
 # Capture device index 0 is opened once, at module import; the resulting
 # `cap` object is the shared source read by the frame-grabbing functions.
 cap = cv2.VideoCapture(0)
@@ -11,7 +12,7 @@ cap = cv2.VideoCapture(0)
 # Load the Hugging Face model and processor
 # Both come from the "Salesforce/blip-vqa-base" checkpoint. The model is moved
 # to CUDA when torch reports it as available, otherwise it stays on the CPU.
 # NOTE(review): this is a VQA checkpoint loaded through
 # BlipForConditionalGeneration - confirm that class (rather than
 # BlipForQuestionAnswering) is the intended one.
 processor = BlipProcessor.from_pretrained("Salesforce/blip-vqa-base")
 model = BlipForConditionalGeneration.from_pretrained("Salesforce/blip-vqa-base").to("cuda" if torch.cuda.is_available() else "cpu")
 def query_the_image(query: str, image_data: bytes):
     try:
         image = Image.open(io.BytesIO(image_data)).convert("RGB")
@@ -21,20 +22,20 @@ def query_the_image(query: str, image_data: bytes):
         return answer
     except Exception as e:
         return f"Error: {e}"
 def get_frame():
     """Read one frame from the module-level `cap` device as JPEG bytes.

     Returns:
         The JPEG-encoded frame as a bytes object, or None when `cap.read()`
         reports no frame or the frame could not be JPEG-encoded.
     """
     ret, frame = cap.read()
     if not ret:
         return None
     # imencode signals failure through its first return value; the buffer is
     # not meaningful in that case, so report it like a failed capture.
     encoded, buffer = cv2.imencode('.jpg', frame)
     if not encoded:
         return None
     return buffer.tobytes()
 def process_image(prompt):
     """Answer `prompt` about a freshly captured frame.

     Grabs a frame via `get_frame()` and forwards it, together with `prompt`,
     to `query_the_image()`.

     Returns:
         Whatever `query_the_image()` returns, or the string
         "Error capturing image" when `get_frame()` yields a falsy value.
     """
     snapshot = get_frame()
     # Guard clause: nothing to query when no frame bytes came back.
     if not snapshot:
         return "Error capturing image"
     return query_the_image(prompt, snapshot)
 def video_feed():
     while True:
         ret, frame = cap.read()

 import torch
 from transformers import BlipProcessor, BlipForConditionalGeneration
 from PIL import Image
+import spaces
 # Initialize the webcam
 # Capture device index 0 is opened once, at module import; the resulting
 # `cap` object is the shared source read by the frame-grabbing functions.
 cap = cv2.VideoCapture(0)
 # Load the Hugging Face model and processor
 # Both come from the "Salesforce/blip-vqa-base" checkpoint. The model is moved
 # to CUDA when torch reports it as available, otherwise it stays on the CPU.
 # NOTE(review): this is a VQA checkpoint loaded through
 # BlipForConditionalGeneration - confirm that class (rather than
 # BlipForQuestionAnswering) is the intended one.
 processor = BlipProcessor.from_pretrained("Salesforce/blip-vqa-base")
 model = BlipForConditionalGeneration.from_pretrained("Salesforce/blip-vqa-base").to("cuda" if torch.cuda.is_available() else "cpu")
+@spaces.GPU
 def query_the_image(query: str, image_data: bytes):
     try:
         image = Image.open(io.BytesIO(image_data)).convert("RGB")
         return answer
     except Exception as e:
         return f"Error: {e}"
+@spaces.GPU
 def get_frame():
     """Read one frame from the module-level `cap` device as JPEG bytes.

     Returns:
         The JPEG-encoded frame as a bytes object, or None when `cap.read()`
         reports no frame or the frame could not be JPEG-encoded.
     """
     ret, frame = cap.read()
     if not ret:
         return None
     # imencode signals failure through its first return value; the buffer is
     # not meaningful in that case, so report it like a failed capture.
     encoded, buffer = cv2.imencode('.jpg', frame)
     if not encoded:
         return None
     return buffer.tobytes()
+@spaces.GPU
 def process_image(prompt):
     """Answer `prompt` about a freshly captured frame.

     Grabs a frame via `get_frame()` and forwards it, together with `prompt`,
     to `query_the_image()`.

     Returns:
         Whatever `query_the_image()` returns, or the string
         "Error capturing image" when `get_frame()` yields a falsy value.
     """
     snapshot = get_frame()
     # Guard clause: nothing to query when no frame bytes came back.
     if not snapshot:
         return "Error capturing image"
     return query_the_image(prompt, snapshot)
+@spaces.GPU
 def video_feed():
     while True:
         ret, frame = cap.read()