commandeaw/DW-KhotTaeVL-2B-QueryFrames

@@ -20,7 +20,7 @@ def main() -> None:
         n_candidates=32,
     )
-    # Wild-mode example (no task taxonomy known).
     result = fv.answer_mcq(
         video_path="example.mp4",
         question="What does the chef do after pouring the oil into the pot?",
@@ -31,14 +31,15 @@ def main() -> None:
             "Adds salt to the pot",
         ],
     )
-    print("[wild mode]")
     print(f"  pred         : {result['pred']}")
     print(f"  raw output   : {result['raw']!r}")
     print(f"  frames used  : {result['frames_used']}")
     print(f"  CLIP latency : {result['latency_clip_s']} s")
     print(f"  GEN  latency : {result['latency_gen_s']} s")
-    # Task-aware example (when task taxonomy is provided, e.g. Video-MME).
     result2 = fv.answer_mcq(
         video_path="example.mp4",
         question="What is happening to the cabbage in the frying pan?",
@@ -50,7 +51,7 @@ def main() -> None:
         ],
         task_type="Object Reasoning",  # → uniform-fallback path
     )
-    print("\n[task-aware mode]")
     print(f"  pred         : {result2['pred']}")
     print(f"  frames used  : {result2['frames_used']}")  # 'uniform_fallback'

         n_candidates=32,
     )
+    # MCQ mode (no task_type) — default.
     result = fv.answer_mcq(
         video_path="example.mp4",
         question="What does the chef do after pouring the oil into the pot?",
             "Adds salt to the pot",
         ],
     )
+    print("[MCQ mode (no task_type)]")
     print(f"  pred         : {result['pred']}")
     print(f"  raw output   : {result['raw']!r}")
     print(f"  frames used  : {result['frames_used']}")
     print(f"  CLIP latency : {result['latency_clip_s']} s")
     print(f"  GEN  latency : {result['latency_gen_s']} s")
+    # Task-aware MCQ mode (when a task taxonomy is supplied, e.g. by
+    # Video-MME or by an operational workflow).
     result2 = fv.answer_mcq(
         video_path="example.mp4",
         question="What is happening to the cabbage in the frying pan?",
         ],
         task_type="Object Reasoning",  # → uniform-fallback path
     )
+    print("\n[Task-aware MCQ mode]")
     print(f"  pred         : {result2['pred']}")
     print(f"  frames used  : {result2['frames_used']}")  # 'uniform_fallback'