Spaces:

sming256
/

VideoAuto-R1_Demo

Running on Zero

sming256 committed on Jan 9

Commit

79e6f86

verified ·

1 Parent(s): 0618c41

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -98,9 +98,8 @@ class Qwen3VLAutoThinkDemo:
         self.model = Qwen3VLForConditionalGeneration.from_pretrained(
             model_path,
             dtype="bfloat16",
-            device_map="auto",
             attn_implementation="sdpa",
-        ).eval()
         self.processor = AutoProcessor.from_pretrained(model_path)
         self.tokenizer = AutoTokenizer.from_pretrained(model_path)
@@ -200,8 +199,8 @@ class Qwen3VLAutoThinkDemo:
         Returns:
             Dictionary containing response and metadata
         """
-        if self.model.device.type != "cuda":
-            self.model.to("cuda")
         # Prepare message
         message = [{"role": "system", "content": self.system_prompt}]

         self.model = Qwen3VLForConditionalGeneration.from_pretrained(
             model_path,
             dtype="bfloat16",
             attn_implementation="sdpa",
+        ).to('cuda').eval()
         self.processor = AutoProcessor.from_pretrained(model_path)
         self.tokenizer = AutoTokenizer.from_pretrained(model_path)
         Returns:
             Dictionary containing response and metadata
         """
+        # if self.model.device.type != "cuda":
+            # self.model.to("cuda")
         # Prepare message
         message = [{"role": "system", "content": self.system_prompt}]