Spaces:
Sleeping
Sleeping
Update runtime_intentbench.py
Browse files
- runtime_intentbench.py +16 -3
runtime_intentbench.py
CHANGED
|
@@ -345,6 +345,8 @@ class RemoteAPIBackend(InferenceBackend):
|
|
| 345 |
"message": "Collector finished via remote API.",
|
| 346 |
"backend_mode": self.mode,
|
| 347 |
"collector_summary": payload.get("collector_summary", ""),
|
|
|
|
|
|
|
| 348 |
}
|
| 349 |
if payload.get("planner_decision"):
|
| 350 |
yield {
|
|
@@ -352,7 +354,9 @@ class RemoteAPIBackend(InferenceBackend):
|
|
| 352 |
"message": "Planner finished via remote API.",
|
| 353 |
"backend_mode": self.mode,
|
| 354 |
"planner_decision": payload.get("planner_decision", ""),
|
|
|
|
| 355 |
"grounder_span_text": payload.get("grounder_span", ""),
|
|
|
|
| 356 |
}
|
| 357 |
if payload.get("grounder_span"):
|
| 358 |
yield {
|
|
@@ -360,20 +364,25 @@ class RemoteAPIBackend(InferenceBackend):
|
|
| 360 |
"message": "Grounder finished via remote API.",
|
| 361 |
"backend_mode": self.mode,
|
| 362 |
"grounder_span_text": payload.get("grounder_span", ""),
|
|
|
|
| 363 |
"grounded_video": payload.get("highlight_clip_path"),
|
|
|
|
| 364 |
}
|
| 365 |
yield {
|
| 366 |
"stage": "answer",
|
| 367 |
"message": "Answer received from remote API.",
|
| 368 |
"backend_mode": self.mode,
|
| 369 |
"final_answer": payload.get("final_answer", ""),
|
| 370 |
-
"answer_raw": payload.get("answer_raw", ""),
|
|
|
|
| 371 |
}
|
| 372 |
yield {
|
| 373 |
"stage": "review",
|
| 374 |
"message": "Review received from remote API.",
|
| 375 |
"backend_mode": self.mode,
|
| 376 |
"review_summary": payload.get("review_summary", ""),
|
|
|
|
|
|
|
| 377 |
}
|
| 378 |
yield {
|
| 379 |
"stage": "done",
|
|
@@ -652,6 +661,7 @@ class CPUFallbackBackend(LocalQwenVLBackend):
|
|
| 652 |
"message": "Collector finished.",
|
| 653 |
"backend_mode": self.mode,
|
| 654 |
"collector_summary": collector_summary,
|
|
|
|
| 655 |
"raw_prompt": format_messages_markdown("Collector Input", collector_messages),
|
| 656 |
}
|
| 657 |
|
|
@@ -672,14 +682,14 @@ class CPUFallbackBackend(LocalQwenVLBackend):
|
|
| 672 |
planner_text = (
|
| 673 |
f"Use Grounder: {use_grounder}\n"
|
| 674 |
f"Grounding Query: {grounding_query or '-'}\n"
|
| 675 |
-
f"Reason: {planner_json.get('reason', '-')}\n"
|
| 676 |
-
f"Raw:\n{planner_raw}"
|
| 677 |
)
|
| 678 |
yield {
|
| 679 |
"stage": "planner",
|
| 680 |
"message": "Planner finished.",
|
| 681 |
"backend_mode": self.mode,
|
| 682 |
"planner_decision": planner_text,
|
|
|
|
| 683 |
"raw_prompt": format_messages_markdown("Planner Input", planner_messages),
|
| 684 |
}
|
| 685 |
|
|
@@ -712,6 +722,7 @@ class CPUFallbackBackend(LocalQwenVLBackend):
|
|
| 712 |
"message": "Grounder finished.",
|
| 713 |
"backend_mode": self.mode,
|
| 714 |
"grounder_span_text": grounded_span_text,
|
|
|
|
| 715 |
"grounded_video": grounded_video,
|
| 716 |
"raw_prompt": format_messages_markdown("Grounder Input", grounder_messages),
|
| 717 |
}
|
|
@@ -721,6 +732,7 @@ class CPUFallbackBackend(LocalQwenVLBackend):
|
|
| 721 |
"message": "Grounder skipped.",
|
| 722 |
"backend_mode": self.mode,
|
| 723 |
"grounder_span_text": grounded_span_text,
|
|
|
|
| 724 |
"grounded_video": None,
|
| 725 |
}
|
| 726 |
|
|
@@ -760,6 +772,7 @@ class CPUFallbackBackend(LocalQwenVLBackend):
|
|
| 760 |
"message": "Review finished.",
|
| 761 |
"backend_mode": self.mode,
|
| 762 |
"review_summary": review_summary,
|
|
|
|
| 763 |
"raw_prompt": format_messages_markdown("Review Input", review_messages),
|
| 764 |
}
|
| 765 |
yield {
|
|
|
|
| 345 |
"message": "Collector finished via remote API.",
|
| 346 |
"backend_mode": self.mode,
|
| 347 |
"collector_summary": payload.get("collector_summary", ""),
|
| 348 |
+
"collector_raw": payload.get("collector_raw", payload.get("collector_summary", "")),
|
| 349 |
+
"raw_prompt": payload.get("collector_prompt", ""),
|
| 350 |
}
|
| 351 |
if payload.get("planner_decision"):
|
| 352 |
yield {
|
|
|
|
| 354 |
"message": "Planner finished via remote API.",
|
| 355 |
"backend_mode": self.mode,
|
| 356 |
"planner_decision": payload.get("planner_decision", ""),
|
| 357 |
+
"planner_raw": payload.get("planner_raw", payload.get("planner_decision", "")),
|
| 358 |
"grounder_span_text": payload.get("grounder_span", ""),
|
| 359 |
+
"raw_prompt": payload.get("planner_prompt", ""),
|
| 360 |
}
|
| 361 |
if payload.get("grounder_span"):
|
| 362 |
yield {
|
|
|
|
| 364 |
"message": "Grounder finished via remote API.",
|
| 365 |
"backend_mode": self.mode,
|
| 366 |
"grounder_span_text": payload.get("grounder_span", ""),
|
| 367 |
+
"grounder_raw": payload.get("grounder_raw", payload.get("grounder_span", "")),
|
| 368 |
"grounded_video": payload.get("highlight_clip_path"),
|
| 369 |
+
"raw_prompt": payload.get("grounder_prompt", ""),
|
| 370 |
}
|
| 371 |
yield {
|
| 372 |
"stage": "answer",
|
| 373 |
"message": "Answer received from remote API.",
|
| 374 |
"backend_mode": self.mode,
|
| 375 |
"final_answer": payload.get("final_answer", ""),
|
| 376 |
+
"answer_raw": payload.get("answer_raw", payload.get("final_answer", "")),
|
| 377 |
+
"raw_prompt": payload.get("answer_prompt", ""),
|
| 378 |
}
|
| 379 |
yield {
|
| 380 |
"stage": "review",
|
| 381 |
"message": "Review received from remote API.",
|
| 382 |
"backend_mode": self.mode,
|
| 383 |
"review_summary": payload.get("review_summary", ""),
|
| 384 |
+
"review_raw": payload.get("review_raw", payload.get("review_summary", "")),
|
| 385 |
+
"raw_prompt": payload.get("review_prompt", ""),
|
| 386 |
}
|
| 387 |
yield {
|
| 388 |
"stage": "done",
|
|
|
|
| 661 |
"message": "Collector finished.",
|
| 662 |
"backend_mode": self.mode,
|
| 663 |
"collector_summary": collector_summary,
|
| 664 |
+
"collector_raw": collector_summary,
|
| 665 |
"raw_prompt": format_messages_markdown("Collector Input", collector_messages),
|
| 666 |
}
|
| 667 |
|
|
|
|
| 682 |
planner_text = (
|
| 683 |
f"Use Grounder: {use_grounder}\n"
|
| 684 |
f"Grounding Query: {grounding_query or '-'}\n"
|
| 685 |
+
f"Reason: {planner_json.get('reason', '-')}"
|
|
|
|
| 686 |
)
|
| 687 |
yield {
|
| 688 |
"stage": "planner",
|
| 689 |
"message": "Planner finished.",
|
| 690 |
"backend_mode": self.mode,
|
| 691 |
"planner_decision": planner_text,
|
| 692 |
+
"planner_raw": planner_raw,
|
| 693 |
"raw_prompt": format_messages_markdown("Planner Input", planner_messages),
|
| 694 |
}
|
| 695 |
|
|
|
|
| 722 |
"message": "Grounder finished.",
|
| 723 |
"backend_mode": self.mode,
|
| 724 |
"grounder_span_text": grounded_span_text,
|
| 725 |
+
"grounder_raw": grounder_raw,
|
| 726 |
"grounded_video": grounded_video,
|
| 727 |
"raw_prompt": format_messages_markdown("Grounder Input", grounder_messages),
|
| 728 |
}
|
|
|
|
| 732 |
"message": "Grounder skipped.",
|
| 733 |
"backend_mode": self.mode,
|
| 734 |
"grounder_span_text": grounded_span_text,
|
| 735 |
+
"grounder_raw": grounded_span_text,
|
| 736 |
"grounded_video": None,
|
| 737 |
}
|
| 738 |
|
|
|
|
| 772 |
"message": "Review finished.",
|
| 773 |
"backend_mode": self.mode,
|
| 774 |
"review_summary": review_summary,
|
| 775 |
+
"review_raw": review_raw,
|
| 776 |
"raw_prompt": format_messages_markdown("Review Input", review_messages),
|
| 777 |
}
|
| 778 |
yield {
|