Spaces:

JetBrains-Research
/

SWE-bench-Costs-Calculator

Running

IgorSlinko committed 1 day ago

Commit

0b7bbfd

1 Parent(s): f734731

Rename to SWE-bench Costs Calculator, open all accordions by default (v0.3.44)

- Fix ONE TRAJECTORY graphs so that they render on the first Load & Analyze
- Open all accordion sections by default
- Rename app title to "SWE-bench Costs Calculator"

Files changed (1) hide show

app.py +15 -16

app.py CHANGED Viewed

@@ -1839,7 +1839,7 @@ def build_app():
         """)
         trajectories_state = gr.State(None)
-        gr.Markdown("# 🧮 SWE-bench analytics tool `v0.3.43`")
         gr.Markdown("### *Calculate cost savings with different routing strategies.*")
         gr.Markdown("## 🎯 Select a base model for cost analysis (click a row)")
@@ -1861,12 +1861,12 @@ def build_app():
                             plot_steps = gr.Plot(label="Distribution of API Calls (Steps) per Trajectory")
                             plot_cost = gr.Plot(label="Distribution of Cost Reported by Leaderboard ($)")
-                    with gr.Accordion("Token counts REPORTED in the metadata of .traj files [AGGREGATED ALL]", open=False):
                         with gr.Row():
                             plot_tokens_meta = gr.Plot(label="Total Tokens by Type")
                             plot_tokens_cost_meta = gr.Plot(label="Total Cost by Token Type ($)")
-                    with gr.Accordion("Token counts REPORTED in the metadata of .traj files [AGGREGATED BY TRAJECTORY]", open=False):
                         with gr.Row():
                             plot_stacked_meta = gr.Plot(label="Tokens per Trajectory (stacked)")
                         with gr.Row():
@@ -1880,18 +1880,18 @@ def build_app():
                         with gr.Row():
                             single_traj_meta_cost_plot = gr.Plot(label="Cost per Step (stacked) ($)")
-                    with gr.Accordion("Token counts CALCULATED from .traj files [AGGREGATED ALL]", open=False):
                         with gr.Row():
                             plot_tokens_calc = gr.Plot(label="Total Tokens by Type")
                             plot_tokens_cost_calc = gr.Plot(label="Total Cost by Token Type ($)")
-                    with gr.Accordion("Token counts CALCULATED from .traj files [AGGREGATED BY TRAJECTORY]", open=False):
                         with gr.Row():
                             plot_stacked_calc = gr.Plot(label="Tokens per Trajectory (stacked)")
                         with gr.Row():
                             plot_cost_breakdown_calc = gr.Plot(label="Cost per Trajectory")
-                    with gr.Accordion("Token counts CALCULATED from .traj files [ONE TRAJECTORY]", open=False, visible=False) as single_traj_accordion:
                         with gr.Row():
                             single_traj_dropdown = gr.Dropdown(label="Select Issue", choices=[], interactive=True)
                         with gr.Row():
@@ -2889,6 +2889,13 @@ def build_app():
             first_meta_issue = meta_issue_ids[0] if meta_issue_ids else None
             has_meta_steps = len(meta_issue_ids) > 0
             fig_single_traj_meta = None
             fig_single_traj_meta_cost = None
             if first_meta_issue and first_meta_issue in metadata_steps:
@@ -2907,8 +2914,8 @@ def build_app():
                 gr.update(visible=True),
                 gr.update(visible=True),
                 gr.update(choices=issue_ids, value=first_issue),
-                gr.update(),
-                gr.update(),
                 gr.update(visible=has_meta_steps),
                 gr.update(choices=meta_issue_ids, value=first_meta_issue),
                 fig_single_traj_meta,
@@ -2957,14 +2964,6 @@ def build_app():
                 single_traj_meta_plot,
                 single_traj_meta_cost_plot,
             ],
-        ).then(
-            fn=on_single_traj_select,
-            inputs=[trajectories_state, single_traj_dropdown, price_input, price_cache_read, price_cache_creation, price_completion, thinking_overhead, use_cache],
-            outputs=[single_traj_plot, single_traj_cost_plot],
-        ).then(
-            fn=on_single_traj_meta_select,
-            inputs=[trajectories_state, single_traj_meta_dropdown, price_input, price_cache_read, price_cache_creation, price_completion],
-            outputs=[single_traj_meta_plot, single_traj_meta_cost_plot],
         )
         def recalculate_costs(state_data, input_price, cache_read_price, cache_creation_price, completion_price, overhead, with_cache):

         """)
         trajectories_state = gr.State(None)
+        gr.Markdown("# 🧮 SWE-bench Costs Calculator `v0.3.44`")
         gr.Markdown("### *Calculate cost savings with different routing strategies.*")
         gr.Markdown("## 🎯 Select a base model for cost analysis (click a row)")
                             plot_steps = gr.Plot(label="Distribution of API Calls (Steps) per Trajectory")
                             plot_cost = gr.Plot(label="Distribution of Cost Reported by Leaderboard ($)")
+                    with gr.Accordion("Token counts REPORTED in the metadata of .traj files [AGGREGATED ALL]", open=True):
                         with gr.Row():
                             plot_tokens_meta = gr.Plot(label="Total Tokens by Type")
                             plot_tokens_cost_meta = gr.Plot(label="Total Cost by Token Type ($)")
+                    with gr.Accordion("Token counts REPORTED in the metadata of .traj files [AGGREGATED BY TRAJECTORY]", open=True):
                         with gr.Row():
                             plot_stacked_meta = gr.Plot(label="Tokens per Trajectory (stacked)")
                         with gr.Row():
                         with gr.Row():
                             single_traj_meta_cost_plot = gr.Plot(label="Cost per Step (stacked) ($)")
+                    with gr.Accordion("Token counts CALCULATED from .traj files [AGGREGATED ALL]", open=True):
                         with gr.Row():
                             plot_tokens_calc = gr.Plot(label="Total Tokens by Type")
                             plot_tokens_cost_calc = gr.Plot(label="Total Cost by Token Type ($)")
+                    with gr.Accordion("Token counts CALCULATED from .traj files [AGGREGATED BY TRAJECTORY]", open=True):
                         with gr.Row():
                             plot_stacked_calc = gr.Plot(label="Tokens per Trajectory (stacked)")
                         with gr.Row():
                             plot_cost_breakdown_calc = gr.Plot(label="Cost per Trajectory")
+                    with gr.Accordion("Token counts CALCULATED from .traj files [ONE TRAJECTORY]", open=True, visible=False) as single_traj_accordion:
                         with gr.Row():
                             single_traj_dropdown = gr.Dropdown(label="Select Issue", choices=[], interactive=True)
                         with gr.Row():
             first_meta_issue = meta_issue_ids[0] if meta_issue_ids else None
             has_meta_steps = len(meta_issue_ids) > 0
+            fig_single_traj = None
+            fig_single_traj_cost = None
+            if first_issue and first_issue in trajectory_steps:
+                calc_steps = trajectory_steps[first_issue]
+                fig_single_traj = create_single_trajectory_chart(calc_steps, overhead, with_cache)
+                fig_single_traj_cost = create_single_trajectory_cost_chart(calc_steps, input_price, cache_read_price, cache_creation_price, completion_price, overhead, with_cache)
             fig_single_traj_meta = None
             fig_single_traj_meta_cost = None
             if first_meta_issue and first_meta_issue in metadata_steps:
                 gr.update(visible=True),
                 gr.update(visible=True),
                 gr.update(choices=issue_ids, value=first_issue),
+                fig_single_traj,
+                fig_single_traj_cost,
                 gr.update(visible=has_meta_steps),
                 gr.update(choices=meta_issue_ids, value=first_meta_issue),
                 fig_single_traj_meta,
                 single_traj_meta_plot,
                 single_traj_meta_cost_plot,
             ],
         )
         def recalculate_costs(state_data, input_price, cache_read_price, cache_creation_price, completion_price, overhead, with_cache):