Spaces:

GF-John
/

video-caption

Running on Zero

John Ho committed on Jul 23, 2025

Commit

8b3dcea

1 Parent(s): 1679d51

make sure DTYPE is used

Files changed (1) hide show

app.py CHANGED Viewed

@@ -49,14 +49,14 @@ def load_model(
     model = (
         Qwen2_5_VLForConditionalGeneration.from_pretrained(
             model_name,
-            torch_dtype=torch.bfloat16,
             attn_implementation="flash_attention_2",
-            device_map="auto",
         )
         if use_flash_attention
         else Qwen2_5_VLForConditionalGeneration.from_pretrained(
             model_name,
-            torch_dtype=torch.bfloat16,  # "auto",
             device_map=DEVICE,
         )
     )
@@ -71,7 +71,10 @@ def inference(
 ):
     # default processor
     processor = AutoProcessor.from_pretrained(
-        "Qwen/Qwen2.5-VL-7B-Instruct", device_map=DEVICE, use_fast=True
     )
     model = load_model(use_flash_attention=use_flash_attention)
     fps = get_fps_ffmpeg(video_path)

     model = (
         Qwen2_5_VLForConditionalGeneration.from_pretrained(
             model_name,
+            torch_dtype=DTYPE,  # torch.bfloat16,
             attn_implementation="flash_attention_2",
+            device_map=DEVICE,  # "auto",
         )
         if use_flash_attention
         else Qwen2_5_VLForConditionalGeneration.from_pretrained(
             model_name,
+            torch_dtype=DTYPE,  # "auto",
             device_map=DEVICE,
         )
     )
@@ -71,7 +71,10 @@ def inference(
 ):
     # default processor
     processor = AutoProcessor.from_pretrained(
+        "Qwen/Qwen2.5-VL-7B-Instruct",
+        device_map=DEVICE,
+        use_fast=True,
+        torch_dtype=DTYPE,
     )
     model = load_model(use_flash_attention=use_flash_attention)
     fps = get_fps_ffmpeg(video_path)