Harry-1234 committed on
Commit
65dbb57
·
verified ·
1 Parent(s): 943108c

Update runtime_intentbench.py

Browse files
Files changed (1) hide show
  1. runtime_intentbench.py +16 -3
runtime_intentbench.py CHANGED
@@ -345,6 +345,8 @@ class RemoteAPIBackend(InferenceBackend):
345
  "message": "Collector finished via remote API.",
346
  "backend_mode": self.mode,
347
  "collector_summary": payload.get("collector_summary", ""),
 
 
348
  }
349
  if payload.get("planner_decision"):
350
  yield {
@@ -352,7 +354,9 @@ class RemoteAPIBackend(InferenceBackend):
352
  "message": "Planner finished via remote API.",
353
  "backend_mode": self.mode,
354
  "planner_decision": payload.get("planner_decision", ""),
 
355
  "grounder_span_text": payload.get("grounder_span", ""),
 
356
  }
357
  if payload.get("grounder_span"):
358
  yield {
@@ -360,20 +364,25 @@ class RemoteAPIBackend(InferenceBackend):
360
  "message": "Grounder finished via remote API.",
361
  "backend_mode": self.mode,
362
  "grounder_span_text": payload.get("grounder_span", ""),
 
363
  "grounded_video": payload.get("highlight_clip_path"),
 
364
  }
365
  yield {
366
  "stage": "answer",
367
  "message": "Answer received from remote API.",
368
  "backend_mode": self.mode,
369
  "final_answer": payload.get("final_answer", ""),
370
- "answer_raw": payload.get("answer_raw", ""),
 
371
  }
372
  yield {
373
  "stage": "review",
374
  "message": "Review received from remote API.",
375
  "backend_mode": self.mode,
376
  "review_summary": payload.get("review_summary", ""),
 
 
377
  }
378
  yield {
379
  "stage": "done",
@@ -652,6 +661,7 @@ class CPUFallbackBackend(LocalQwenVLBackend):
652
  "message": "Collector finished.",
653
  "backend_mode": self.mode,
654
  "collector_summary": collector_summary,
 
655
  "raw_prompt": format_messages_markdown("Collector Input", collector_messages),
656
  }
657
 
@@ -672,14 +682,14 @@ class CPUFallbackBackend(LocalQwenVLBackend):
672
  planner_text = (
673
  f"Use Grounder: {use_grounder}\n"
674
  f"Grounding Query: {grounding_query or '-'}\n"
675
- f"Reason: {planner_json.get('reason', '-')}\n\n"
676
- f"Raw:\n{planner_raw}"
677
  )
678
  yield {
679
  "stage": "planner",
680
  "message": "Planner finished.",
681
  "backend_mode": self.mode,
682
  "planner_decision": planner_text,
 
683
  "raw_prompt": format_messages_markdown("Planner Input", planner_messages),
684
  }
685
 
@@ -712,6 +722,7 @@ class CPUFallbackBackend(LocalQwenVLBackend):
712
  "message": "Grounder finished.",
713
  "backend_mode": self.mode,
714
  "grounder_span_text": grounded_span_text,
 
715
  "grounded_video": grounded_video,
716
  "raw_prompt": format_messages_markdown("Grounder Input", grounder_messages),
717
  }
@@ -721,6 +732,7 @@ class CPUFallbackBackend(LocalQwenVLBackend):
721
  "message": "Grounder skipped.",
722
  "backend_mode": self.mode,
723
  "grounder_span_text": grounded_span_text,
 
724
  "grounded_video": None,
725
  }
726
 
@@ -760,6 +772,7 @@ class CPUFallbackBackend(LocalQwenVLBackend):
760
  "message": "Review finished.",
761
  "backend_mode": self.mode,
762
  "review_summary": review_summary,
 
763
  "raw_prompt": format_messages_markdown("Review Input", review_messages),
764
  }
765
  yield {
 
345
  "message": "Collector finished via remote API.",
346
  "backend_mode": self.mode,
347
  "collector_summary": payload.get("collector_summary", ""),
348
+ "collector_raw": payload.get("collector_raw", payload.get("collector_summary", "")),
349
+ "raw_prompt": payload.get("collector_prompt", ""),
350
  }
351
  if payload.get("planner_decision"):
352
  yield {
 
354
  "message": "Planner finished via remote API.",
355
  "backend_mode": self.mode,
356
  "planner_decision": payload.get("planner_decision", ""),
357
+ "planner_raw": payload.get("planner_raw", payload.get("planner_decision", "")),
358
  "grounder_span_text": payload.get("grounder_span", ""),
359
+ "raw_prompt": payload.get("planner_prompt", ""),
360
  }
361
  if payload.get("grounder_span"):
362
  yield {
 
364
  "message": "Grounder finished via remote API.",
365
  "backend_mode": self.mode,
366
  "grounder_span_text": payload.get("grounder_span", ""),
367
+ "grounder_raw": payload.get("grounder_raw", payload.get("grounder_span", "")),
368
  "grounded_video": payload.get("highlight_clip_path"),
369
+ "raw_prompt": payload.get("grounder_prompt", ""),
370
  }
371
  yield {
372
  "stage": "answer",
373
  "message": "Answer received from remote API.",
374
  "backend_mode": self.mode,
375
  "final_answer": payload.get("final_answer", ""),
376
+ "answer_raw": payload.get("answer_raw", payload.get("final_answer", "")),
377
+ "raw_prompt": payload.get("answer_prompt", ""),
378
  }
379
  yield {
380
  "stage": "review",
381
  "message": "Review received from remote API.",
382
  "backend_mode": self.mode,
383
  "review_summary": payload.get("review_summary", ""),
384
+ "review_raw": payload.get("review_raw", payload.get("review_summary", "")),
385
+ "raw_prompt": payload.get("review_prompt", ""),
386
  }
387
  yield {
388
  "stage": "done",
 
661
  "message": "Collector finished.",
662
  "backend_mode": self.mode,
663
  "collector_summary": collector_summary,
664
+ "collector_raw": collector_summary,
665
  "raw_prompt": format_messages_markdown("Collector Input", collector_messages),
666
  }
667
 
 
682
  planner_text = (
683
  f"Use Grounder: {use_grounder}\n"
684
  f"Grounding Query: {grounding_query or '-'}\n"
685
+ f"Reason: {planner_json.get('reason', '-')}"
 
686
  )
687
  yield {
688
  "stage": "planner",
689
  "message": "Planner finished.",
690
  "backend_mode": self.mode,
691
  "planner_decision": planner_text,
692
+ "planner_raw": planner_raw,
693
  "raw_prompt": format_messages_markdown("Planner Input", planner_messages),
694
  }
695
 
 
722
  "message": "Grounder finished.",
723
  "backend_mode": self.mode,
724
  "grounder_span_text": grounded_span_text,
725
+ "grounder_raw": grounder_raw,
726
  "grounded_video": grounded_video,
727
  "raw_prompt": format_messages_markdown("Grounder Input", grounder_messages),
728
  }
 
732
  "message": "Grounder skipped.",
733
  "backend_mode": self.mode,
734
  "grounder_span_text": grounded_span_text,
735
+ "grounder_raw": grounded_span_text,
736
  "grounded_video": None,
737
  }
738
 
 
772
  "message": "Review finished.",
773
  "backend_mode": self.mode,
774
  "review_summary": review_summary,
775
+ "review_raw": review_raw,
776
  "raw_prompt": format_messages_markdown("Review Input", review_messages),
777
  }
778
  yield {