Solves 500 Errors For Some Users

#1
by Tonic - opened
This view is limited to 50 files because it contains too many changes. See the raw diff here.
Files changed (50) hide show
  1. .gitattributes +1 -1
  2. .gitignore +13 -1
  3. .pre-commit-config.yaml +53 -0
  4. .streamlit/config.toml +0 -2
  5. CLAUDE.md +0 -82
  6. Dockerfile +0 -21
  7. Makefile +13 -0
  8. README.md +36 -12
  9. app.py +97 -0
  10. fev-leaderboard-app.py +0 -9
  11. pages/about.py +0 -19
  12. pages/fev_bench.py +0 -284
  13. pyproject.toml +13 -12
  14. requirements.txt +8 -4
  15. save_tables.py +0 -241
  16. src/about.py +50 -0
  17. src/colors.py +0 -6
  18. src/custom_html_js.py +99 -0
  19. src/formatting.py +31 -0
  20. src/streamlit_app.py +0 -9
  21. src/strings.py +0 -114
  22. src/task_groups.py +0 -266
  23. src/utils.py +0 -413
  24. tables/domain_cloud/leaderboard_MASE.csv +0 -29
  25. tables/domain_cloud/leaderboard_SQL.csv +0 -29
  26. tables/domain_cloud/leaderboard_WAPE.csv +0 -29
  27. tables/domain_cloud/leaderboard_WQL.csv +0 -29
  28. tables/domain_cloud/pairwise_MASE.csv +0 -290
  29. tables/domain_cloud/pairwise_SQL.csv +0 -290
  30. tables/domain_cloud/pairwise_WAPE.csv +0 -290
  31. tables/domain_cloud/pairwise_WQL.csv +0 -290
  32. tables/domain_econ/leaderboard_MASE.csv +0 -29
  33. tables/domain_econ/leaderboard_SQL.csv +0 -29
  34. tables/domain_econ/leaderboard_WAPE.csv +0 -29
  35. tables/domain_econ/leaderboard_WQL.csv +0 -29
  36. tables/domain_econ/pairwise_MASE.csv +0 -290
  37. tables/domain_econ/pairwise_SQL.csv +0 -290
  38. tables/domain_econ/pairwise_WAPE.csv +0 -290
  39. tables/domain_econ/pairwise_WQL.csv +0 -257
  40. tables/domain_energy/leaderboard_MASE.csv +0 -29
  41. tables/domain_energy/leaderboard_SQL.csv +0 -29
  42. tables/domain_energy/leaderboard_WAPE.csv +0 -29
  43. tables/domain_energy/leaderboard_WQL.csv +0 -29
  44. tables/domain_energy/pairwise_MASE.csv +0 -257
  45. tables/domain_energy/pairwise_SQL.csv +0 -257
  46. tables/domain_energy/pairwise_WAPE.csv +0 -257
  47. tables/domain_energy/pairwise_WQL.csv +0 -257
  48. tables/domain_health/leaderboard_MASE.csv +0 -29
  49. tables/domain_health/leaderboard_SQL.csv +0 -29
  50. tables/domain_health/leaderboard_WAPE.csv +0 -29
.gitattributes CHANGED
@@ -25,7 +25,6 @@
25
  *.safetensors filter=lfs diff=lfs merge=lfs -text
26
  saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
  *.tar.* filter=lfs diff=lfs merge=lfs -text
28
- *.tar filter=lfs diff=lfs merge=lfs -text
29
  *.tflite filter=lfs diff=lfs merge=lfs -text
30
  *.tgz filter=lfs diff=lfs merge=lfs -text
31
  *.wasm filter=lfs diff=lfs merge=lfs -text
@@ -33,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
25
  *.safetensors filter=lfs diff=lfs merge=lfs -text
26
  saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
  *.tar.* filter=lfs diff=lfs merge=lfs -text
 
28
  *.tflite filter=lfs diff=lfs merge=lfs -text
29
  *.tgz filter=lfs diff=lfs merge=lfs -text
30
  *.wasm filter=lfs diff=lfs merge=lfs -text
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ scale-hf-logo.png filter=lfs diff=lfs merge=lfs -text
.gitignore CHANGED
@@ -1 +1,13 @@
1
- __pycache__
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ auto_evals/
2
+ venv/
3
+ __pycache__/
4
+ .env
5
+ .ipynb_checkpoints
6
+ *ipynb
7
+ .vscode/
8
+
9
+ eval-queue/
10
+ eval-results/
11
+ eval-queue-bk/
12
+ eval-results-bk/
13
+ logs/
.pre-commit-config.yaml ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright (c) 2022, NVIDIA CORPORATION. All rights reserved.
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ default_language_version:
16
+ python: python3
17
+
18
+ ci:
19
+ autofix_prs: true
20
+ autoupdate_commit_msg: '[pre-commit.ci] pre-commit suggestions'
21
+ autoupdate_schedule: quarterly
22
+
23
+ repos:
24
+ - repo: https://github.com/pre-commit/pre-commit-hooks
25
+ rev: v4.3.0
26
+ hooks:
27
+ - id: check-yaml
28
+ - id: check-case-conflict
29
+ - id: detect-private-key
30
+ - id: check-added-large-files
31
+ args: ['--maxkb=1000']
32
+ - id: requirements-txt-fixer
33
+ - id: end-of-file-fixer
34
+ - id: trailing-whitespace
35
+
36
+ - repo: https://github.com/PyCQA/isort
37
+ rev: 5.12.0
38
+ hooks:
39
+ - id: isort
40
+ name: Format imports
41
+
42
+ - repo: https://github.com/psf/black
43
+ rev: 22.12.0
44
+ hooks:
45
+ - id: black
46
+ name: Format code
47
+ additional_dependencies: ['click==8.0.2']
48
+
49
+ - repo: https://github.com/charliermarsh/ruff-pre-commit
50
+ # Ruff version.
51
+ rev: 'v0.0.267'
52
+ hooks:
53
+ - id: ruff
.streamlit/config.toml DELETED
@@ -1,2 +0,0 @@
1
- [theme]
2
- base = "light"
 
 
 
CLAUDE.md DELETED
@@ -1,82 +0,0 @@
1
- # CLAUDE.md
2
-
3
- This file provides guidance to Claude Code (claude.ai/code) when working with code in this repository.
4
-
5
- ## Project Overview
6
-
7
- fev-bench Leaderboard is a Streamlit web application displaying time series forecasting model evaluation results from the fev-bench benchmark. It evaluates 30+ forecasting models using multiple metrics (SQL, MASE, WQL, WAPE) across 100 benchmark tasks.
8
-
9
- ## Common Commands
10
-
11
- ```bash
12
- # Run the Streamlit app locally
13
- uv run streamlit run fev-leaderboard-app.py --server.port=8501 --server.address=0.0.0.0
14
-
15
- # Regenerate leaderboard tables from autogluon/fev repo (defaults to main branch)
16
- uv run python save_tables.py [commit] # e.g., uv run python save_tables.py abc123
17
-
18
- # Docker build and run
19
- docker build -t fev-leaderboard .
20
- docker run -p 8501:8501 fev-leaderboard
21
- ```
22
-
23
- Note: Use `uv run` prefix for all Python commands in this project.
24
-
25
- No test or lint frameworks are configured.
26
-
27
- ## Architecture
28
-
29
- ```
30
- fev-leaderboard-app.py # Main entry point (Streamlit multi-page router)
31
- save_tables.py # Generates pre-computed CSV tables from raw summaries
32
- pages/
33
- ├── fev_bench.py # Main leaderboard (100 tasks, loads from tables/)
34
- ├── chronos_bench_ii.py # Alternative leaderboard (27 tasks, fetches from GitHub)
35
- └── about.py # Help page with links
36
- src/
37
- ├── utils.py # Visualization, formatting, MODEL_CONFIG, color palette
38
- ├── strings.py # UI text, metric descriptions, paper citations
39
- └── task_groups.py # Task groupings by frequency and domain
40
- tables/ # Pre-generated CSVs
41
- ├── pivot_*.csv # Full pivot tables (filtered in app by task group)
42
- ├── summaries.csv # Raw evaluation summaries
43
- └── {group}/ # Subdirectories for each task group (full, mini, frequency_*, domain_*)
44
- ├── leaderboard_*.csv # Leaderboard tables per metric
45
- └── pairwise_*.csv # Pairwise comparison tables per metric
46
- ```
47
-
48
- **Data flow**: GitHub (autogluon/fev) → `save_tables.py` → pre-computed tables → `fev_bench.py` visualization
49
-
50
- ## Key Modules
51
-
52
- **`src/utils.py`**: Core module containing:
53
- - `MODEL_CONFIG`: Dict mapping model names to (huggingface_url, organization, is_zero_shot, model_type)
54
- - `ALL_METRICS`: Dict with SQL, MASE, WQL, WAPE definitions
55
- - `format_leaderboard()`, `construct_bar_chart()`, `construct_pairwise_chart()`, `construct_pivot_table()`: Styling functions
56
- - `COLORS`: Custom palette (purple, gold, silver, bronze)
57
-
58
- **`src/strings.py`**: Documentation strings for metric formulas, win rate/skill score calculations, imputation strategies
59
-
60
- ## Metrics
61
-
62
- | Metric | Type | Description |
63
- |--------|------|-------------|
64
- | SQL | Probabilistic | Scaled Quantile Loss (scale-invariant) |
65
- | MASE | Point | Mean Absolute Scaled Error (scale-invariant) |
66
- | WQL | Probabilistic | Weighted Quantile Loss (scale-dependent) |
67
- | WAPE | Point | Weighted Absolute Percentage Error (scale-dependent) |
68
-
69
- ## Model Types
70
-
71
- Models are categorized as DL (deep learning) or ST (statistical) in `MODEL_CONFIG`. This affects color-coding in visualizations (blue vs. orange).
72
-
73
- ## Imputation Strategy
74
-
75
- - **Failed tasks**: Replaced with Seasonal Naive scores
76
- - **Leaky tasks** (training corpus overlap for zero-shot models): Replaced with Chronos-Bolt scores
77
-
78
- ## External References
79
-
80
- - fev-bench paper: https://arxiv.org/abs/2509.26468
81
- - fev library docs: https://autogluon.github.io/fev/latest/
82
- - GitHub: https://github.com/autogluon/fev
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Dockerfile DELETED
@@ -1,21 +0,0 @@
1
- FROM python:3.13.5-slim
2
-
3
- RUN useradd -m -u 1000 user
4
- WORKDIR /app
5
-
6
- RUN apt-get update && apt-get install -y \
7
- build-essential \
8
- curl \
9
- git \
10
- && rm -rf /var/lib/apt/lists/*
11
-
12
- COPY --chown=user ./requirements.txt requirements.txt
13
- COPY --chown=user . /app
14
-
15
- RUN pip3 install -r requirements.txt
16
-
17
- EXPOSE 8501
18
-
19
- HEALTHCHECK CMD curl --fail http://localhost:8501/_stcore/health
20
-
21
- ENTRYPOINT ["streamlit", "run", "fev-leaderboard-app.py", "--server.port=8501", "--server.address=0.0.0.0"]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Makefile ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ .PHONY: style format
2
+
3
+
4
+ style:
5
+ python -m black --line-length 119 .
6
+ python -m isort .
7
+ ruff check --fix .
8
+
9
+
10
+ quality:
11
+ python -m black --check --line-length 119 .
12
+ python -m isort --check-only .
13
+ ruff check .
README.md CHANGED
@@ -1,20 +1,44 @@
1
  ---
2
- title: fev-bench
3
- emoji: 🏆
4
  colorFrom: green
5
  colorTo: indigo
6
- sdk: docker
7
- app_port: 8501
8
- tags:
9
- - streamlit
10
- pinned: false
11
- short_description: Forecast evaluation benchmark
12
  license: apache-2.0
13
  ---
14
 
15
- # Welcome to Streamlit!
16
 
17
- Edit `/src/streamlit_app.py` to customize this app to your heart's desire. :heart:
18
 
19
- If you have any questions, checkout our [documentation](https://docs.streamlit.io) and [community
20
- forums](https://discuss.streamlit.io).
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  ---
2
+ title: Fev Leaderboard
3
+ emoji: 🥇
4
  colorFrom: green
5
  colorTo: indigo
6
+ sdk: gradio
7
+ app_file: app.py
8
+ pinned: true
 
 
 
9
  license: apache-2.0
10
  ---
11
 
12
+ # Start the configuration
13
 
14
+ Most of the variables to change for a default leaderboard are in `src/env.py` (replace the path for your leaderboard) and `src/about.py` (for tasks).
15
 
16
+ Results files should have the following format and be stored as json files:
17
+ ```json
18
+ {
19
+ "config": {
20
+ "model_dtype": "torch.float16", # or torch.bfloat16 or 8bit or 4bit
21
+ "model_name": "path of the model on the hub: org/model",
22
+ "model_sha": "revision on the hub",
23
+ },
24
+ "results": {
25
+ "task_name": {
26
+ "metric_name": score,
27
+ },
28
+ "task_name2": {
29
+ "metric_name": score,
30
+ }
31
+ }
32
+ }
33
+ ```
34
+
35
+ Request files are created automatically by this tool.
36
+
37
+ If you encounter problem on the space, don't hesitate to restart it to remove the create eval-queue, eval-queue-bk, eval-results and eval-results-bk created folder.
38
+
39
+ # Code logic for more complex edits
40
+
41
+ You'll find
42
+ - the main table' columns names and properties in `src/display/utils.py`
43
+ - the logic to read all results and request files, then convert them in dataframe lines, in `src/leaderboard/read_evals.py`, and `src/populate.py`
44
+ - the logic to allow or filter submissions in `src/submission/submit.py` and `src/submission/check_validity.py`
app.py ADDED
@@ -0,0 +1,97 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import fev
2
+ import gradio as gr
3
+ import pandas as pd
4
+
5
+ from src import about
6
+ from src.custom_html_js import custom_css
7
+ from src.formatting import make_clickable_model
8
+
9
+ # Load the CSV data into a pandas DataFrame
10
+ df = pd.read_csv(
11
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/seasonal_naive.csv"
12
+ )
13
+
14
+
15
+ summary_urls = [
16
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/auto_arima.csv",
17
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/auto_ets.csv",
18
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/auto_theta.csv",
19
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/chronos_base.csv",
20
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/chronos_large.csv",
21
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/chronos_mini.csv",
22
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/chronos_small.csv",
23
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/chronos_tiny.csv",
24
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/chronos_bolt_base.csv",
25
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/chronos_bolt_mini.csv",
26
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/chronos_bolt_small.csv",
27
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/chronos_bolt_tiny.csv",
28
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/moirai_base.csv",
29
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/moirai_large.csv",
30
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/moirai_small.csv",
31
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/seasonal_naive.csv",
32
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/timesfm.csv",
33
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/timesfm-2.0.csv",
34
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/ttm-r2.csv",
35
+ "https://raw.githubusercontent.com/autogluon/fev/refs/heads/main/benchmarks/chronos_zeroshot/results/tirex.csv",
36
+ ]
37
+
38
+ rename_cols = {
39
+ "gmean_relative_error": "Average relative error",
40
+ "avg_rank": "Average rank",
41
+ "median_inference_time_s": "Median inference time (s)",
42
+ "training_corpus_overlap": "Training corpus overlap (%)",
43
+ }
44
+ selected_cols = list(rename_cols.keys())
45
+
46
+
47
+ def highlight_zeroshot(styler):
48
+ """Highlight training overlap for zero-shot models with bold green."""
49
+
50
+ def style_func(val):
51
+ if val == 0:
52
+ return "color: green; font-weight: bold"
53
+ else:
54
+ return "color: black"
55
+
56
+ return styler.map(style_func, subset=["Training corpus overlap (%)"])
57
+
58
+
59
+ leaderboards = {}
60
+ for metric in ["WQL", "MASE"]:
61
+ lb = fev.leaderboard(summary_urls, metric_column=metric)[selected_cols].rename(columns=rename_cols)
62
+ lb = lb.astype("float64").round(3).reset_index()
63
+ lb["Training corpus overlap (%)"] = (lb["Training corpus overlap (%)"] * 100).round(1)
64
+ lb["model_name"] = lb["model_name"].apply(make_clickable_model)
65
+ leaderboards[metric] = highlight_zeroshot(lb.style).format(precision=3)
66
+
67
+
68
+ with gr.Blocks(css=custom_css) as demo:
69
+ gr.HTML(about.TITLE)
70
+ gr.Markdown(about.INTRODUCTION_TEXT, elem_classes="markdown-text")
71
+
72
+ with gr.Tabs(elem_classes="tab-buttons"):
73
+ with gr.Tab("🏅 Chronos Benchmark II", id=0):
74
+ with gr.Column():
75
+ gr.Markdown(about.CHRONOS_BENCHMARK, elem_classes="markdown-text")
76
+ with gr.Tabs():
77
+ with gr.Tab("📊 Probabilistic forecast (WQL)"):
78
+ gr.Markdown("""Forecast accuracy measured by Weighted Quantile Loss.""")
79
+ gr.Dataframe(
80
+ value=leaderboards["WQL"],
81
+ datatype=["markdown", "number", "number", "number"],
82
+ interactive=False,
83
+ )
84
+
85
+ with gr.Tab("📈 Point forecast (MASE)"):
86
+ gr.Markdown("""Forecast accuracy measured by Mean Absolute Scaled Error.""")
87
+ gr.Dataframe(
88
+ value=leaderboards["MASE"],
89
+ datatype=["markdown", "number", "number", "number"],
90
+ interactive=False,
91
+ )
92
+
93
+ with gr.Tab("📝 About", id=1):
94
+ gr.Markdown(about.ABOUT_LEADERBOARD)
95
+
96
+ if __name__ == "__main__":
97
+ demo.launch(ssr_mode=False)
fev-leaderboard-app.py DELETED
@@ -1,9 +0,0 @@
1
- import streamlit as st
2
-
3
- pages = [
4
- st.Page("pages/fev_bench.py", title="fev-bench", icon=":material/trophy:"),
5
- st.Page("pages/about.py", title="About", icon=":material/info:"),
6
- ]
7
-
8
- page = st.navigation(pages)
9
- page.run()
 
 
 
 
 
 
 
 
 
 
pages/about.py DELETED
@@ -1,19 +0,0 @@
1
- import streamlit as st
2
-
3
- ABOUT_LEADERBOARD = """
4
- ## About
5
-
6
- [**fev**](https://github.com/autogluon/fev) is a lightweight wrapper around the 🤗 [datasets](https://huggingface.co/docs/datasets/en/index) library designed to streamline
7
- benchmarking of time series forecasting models.
8
-
9
- ### 📚 Resources
10
- - **Documentation**: [Official docs](https://autogluon.github.io/fev/latest/)
11
- - **Publication**: ["fev-bench: A Realistic Benchmark for Time Series Forecasting"](https://arxiv.org/abs/2509.26468)
12
- - **Source Code**: [GitHub repository](https://github.com/autogluon/fev)
13
- - **Issues & Questions**: [GitHub Issues](https://github.com/autogluon/fev/issues)
14
-
15
- ### 🚀 Submit Your Model
16
- Ready to add your model to the leaderboard? Follow this [tutorial](https://autogluon.github.io/fev/latest/tutorials/05-add-your-model/) to evaluate your model with fev and contribute your results.
17
- """
18
- st.set_page_config(layout="wide", page_title="About FEV", page_icon=":material/info:")
19
- st.markdown(ABOUT_LEADERBOARD)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
pages/fev_bench.py DELETED
@@ -1,284 +0,0 @@
1
- import sys
2
- from pathlib import Path
3
-
4
- sys.path.append(str(Path(__file__).parent))
5
-
6
- import pandas as pd
7
- import streamlit as st
8
- from src.strings import (
9
- CITATION_FEV,
10
- CITATION_HEADER,
11
- FEV_BENCHMARK_DETAILS,
12
- PAIRWISE_BENCHMARK_DETAILS,
13
- get_pivot_legend,
14
- )
15
- from src.task_groups import (
16
- ALL_TASKS,
17
- DOMAIN_GROUPS,
18
- FREQUENCY_GROUPS,
19
- MINI_TASKS,
20
- TASK_TYPE_GROUPS,
21
- )
22
- from src.utils import (
23
- COLORS,
24
- HIDDEN_MODELS,
25
- construct_pairwise_chart,
26
- filter_hidden_models,
27
- format_leaderboard,
28
- format_metric_name,
29
- get_metric_description,
30
- validate_model_metadata,
31
- )
32
- from streamlit.elements.lib.column_types import ColumnConfig
33
-
34
- st.set_page_config(
35
- layout="wide", page_title="fev leaderboard", page_icon=":material/trophy:"
36
- )
37
-
38
- TITLE = "<h1 style='text-align: center; font-size: 350%;'>fev-bench</h1>"
39
- SORT_COL = "win_rate"
40
- AVAILABLE_METRICS = ["SQL", "MASE", "WQL", "WAPE"]
41
-
42
- # Group type options
43
- GROUP_TYPES = [
44
- "Full (100 tasks)",
45
- "Mini (20 tasks)",
46
- "By frequency",
47
- "By domain",
48
- "By task type",
49
- ]
50
- FREQUENCY_OPTIONS = list(FREQUENCY_GROUPS.keys())
51
- DOMAIN_OPTIONS = list(DOMAIN_GROUPS.keys())
52
- TASK_TYPE_OPTIONS = list(TASK_TYPE_GROUPS.keys())
53
-
54
-
55
- def get_subset_description(
56
- group_type: str, subgroup: str | None, num_tasks: int, metric_name: str
57
- ) -> str:
58
- """Generate a description of the current subset."""
59
- base = f"Results for various forecasting models, measured using the **{metric_name}** metric, on **{num_tasks} tasks**"
60
- if group_type == "Full (100 tasks)":
61
- subset_desc = "from the full **fev-bench** benchmark"
62
- elif group_type == "Mini (20 tasks)":
63
- subset_desc = "from the **fev-bench-mini** subset"
64
- elif group_type == "By frequency":
65
- subset_desc = f"with **{subgroup.lower()}** frequency"
66
- elif group_type == "By task type":
67
- subset_desc = f"of type **{subgroup.lower()}**"
68
- else: # By domain
69
- subset_desc = f"from the **{subgroup}** domain"
70
- paper_link = "[fev-bench: A Realistic Benchmark for Time Series Forecasting](https://arxiv.org/abs/2509.26468)"
71
- return f"{base} {subset_desc}, as described in {paper_link}."
72
-
73
-
74
- # Mapping from UI selections to table directory names
75
- GROUP_DIR_MAPPING = {
76
- "Full (100 tasks)": "full",
77
- "Mini (20 tasks)": "mini",
78
- "Sub-hourly": "frequency_sub_hourly",
79
- "Hourly": "frequency_hourly",
80
- "Daily": "frequency_daily",
81
- "Weekly": "frequency_weekly",
82
- "Monthly+": "frequency_monthly_plus",
83
- "Energy": "domain_energy",
84
- "Nature": "domain_nature",
85
- "Cloud": "domain_cloud",
86
- "Mobility": "domain_mobility",
87
- "Econ": "domain_econ",
88
- "Health": "domain_health",
89
- "Retail": "domain_retail",
90
- "Univariate": "task_type_univariate",
91
- "Covariate-informed": "task_type_covariate_informed",
92
- "Multivariate": "task_type_multivariate",
93
- }
94
-
95
-
96
- @st.cache_data()
97
- def get_leaderboard(metric_name: str, group_dir: str) -> pd.DataFrame:
98
- return pd.read_csv(f"tables/{group_dir}/leaderboard_{metric_name}.csv")
99
-
100
-
101
- @st.cache_data()
102
- def get_pairwise(metric_name: str, group_dir: str) -> pd.DataFrame:
103
- return pd.read_csv(f"tables/{group_dir}/pairwise_{metric_name}.csv")
104
-
105
-
106
- @st.cache_data()
107
- def get_pivot_table(
108
- metric_name: str,
109
- ) -> tuple[pd.DataFrame, pd.DataFrame, pd.DataFrame]:
110
- pivot_df = pd.read_csv(f"tables/pivot_{metric_name}.csv")
111
- baseline_imputed = pd.read_csv(f"tables/pivot_{metric_name}_baseline_imputed.csv")
112
- leakage_imputed = pd.read_csv(f"tables/pivot_{metric_name}_leakage_imputed.csv")
113
- return pivot_df, baseline_imputed, leakage_imputed
114
-
115
-
116
- with st.sidebar:
117
- # Task group selection
118
- selected_group_type = st.selectbox("Subset", options=GROUP_TYPES)
119
-
120
- # Conditional sub-selection for frequency/domain
121
- selected_subgroup = None
122
- if selected_group_type == "By frequency":
123
- selected_subgroup = st.selectbox("Frequency", options=FREQUENCY_OPTIONS)
124
- elif selected_group_type == "By domain":
125
- selected_subgroup = st.selectbox("Domain", options=DOMAIN_OPTIONS)
126
- elif selected_group_type == "By task type":
127
- selected_subgroup = st.selectbox("Task type", options=TASK_TYPE_OPTIONS)
128
-
129
- # Determine the directory to load tables from
130
- if selected_group_type in ["Full (100 tasks)", "Mini (20 tasks)"]:
131
- group_dir = GROUP_DIR_MAPPING[selected_group_type]
132
- task_list = (
133
- ALL_TASKS if selected_group_type == "Full (100 tasks)" else MINI_TASKS
134
- )
135
- else:
136
- group_dir = GROUP_DIR_MAPPING[selected_subgroup]
137
- if selected_group_type == "By frequency":
138
- task_list = FREQUENCY_GROUPS[selected_subgroup]
139
- elif selected_group_type == "By task type":
140
- task_list = TASK_TYPE_GROUPS[selected_subgroup]
141
- else:
142
- task_list = DOMAIN_GROUPS[selected_subgroup]
143
-
144
- st.caption(f"{len(task_list)} tasks")
145
-
146
- st.divider()
147
-
148
- selected_metric = st.selectbox(
149
- "Evaluation Metric", options=AVAILABLE_METRICS, format_func=format_metric_name
150
- )
151
- st.caption(get_metric_description(selected_metric))
152
-
153
- cols = st.columns(spec=[0.025, 0.95, 0.025])
154
-
155
- with cols[1] as main_container:
156
- st.markdown(TITLE, unsafe_allow_html=True)
157
-
158
- metric_df = get_leaderboard(selected_metric, group_dir).sort_values(
159
- by=SORT_COL, ascending=False
160
- )
161
- metric_df = filter_hidden_models(metric_df, "model_name")
162
- validate_model_metadata(metric_df["model_name"])
163
-
164
- pairwise_df = get_pairwise(selected_metric, group_dir)
165
- pairwise_df = filter_hidden_models(
166
- filter_hidden_models(pairwise_df, "model_1"), "model_2"
167
- )
168
-
169
- st.markdown("## :material/trophy: Leaderboard", unsafe_allow_html=True)
170
- st.markdown(
171
- get_subset_description(
172
- selected_group_type, selected_subgroup, len(task_list), selected_metric
173
- ),
174
- unsafe_allow_html=True,
175
- )
176
- df_styled = format_leaderboard(metric_df)
177
- st.dataframe(
178
- df_styled,
179
- width="stretch",
180
- hide_index=True,
181
- column_config={
182
- "model_name": ColumnConfig(label="Model Name", alignment="left"),
183
- "win_rate": st.column_config.NumberColumn(
184
- label="Avg. win rate (%)", format="%.1f"
185
- ),
186
- "skill_score": st.column_config.NumberColumn(
187
- label="Skill score (%)", format="%.1f"
188
- ),
189
- "median_inference_time_s_per100": st.column_config.NumberColumn(
190
- label="Median runtime (s / 100 series)", format="%.1f"
191
- ),
192
- "training_corpus_overlap": st.column_config.NumberColumn(
193
- label="Leakage (%)", format="%d"
194
- ),
195
- "num_failures": st.column_config.NumberColumn(
196
- label="Failed tasks (%)", format="%.0f"
197
- ),
198
- "zero_shot": ColumnConfig(label="Zero-shot", alignment="center"),
199
- "org": ColumnConfig(label="Organization", alignment="left"),
200
- "link": st.column_config.LinkColumn(label="Link", display_text="🔗"),
201
- },
202
- )
203
-
204
- with st.expander("See details"):
205
- st.markdown(FEV_BENCHMARK_DETAILS, unsafe_allow_html=True)
206
-
207
- st.markdown("## :material/bar_chart: Pairwise comparison", unsafe_allow_html=True)
208
- chart_col_1, _, chart_col_2 = st.columns(spec=[0.45, 0.1, 0.45])
209
-
210
- with chart_col_1:
211
- st.altair_chart(
212
- construct_pairwise_chart(
213
- pairwise_df, col="win_rate", metric_name=selected_metric
214
- ),
215
- use_container_width=True,
216
- )
217
-
218
- with chart_col_2:
219
- st.altair_chart(
220
- construct_pairwise_chart(
221
- pairwise_df, col="skill_score", metric_name=selected_metric
222
- ),
223
- use_container_width=True,
224
- )
225
-
226
- with st.expander("See details"):
227
- st.markdown(PAIRWISE_BENCHMARK_DETAILS, unsafe_allow_html=True)
228
-
229
- st.markdown(
230
- "## :material/table_chart: Results for individual tasks", unsafe_allow_html=True
231
- )
232
- with st.expander("Show detailed results"):
233
- st.markdown(
234
- get_pivot_legend("Seasonal Naive", "Chronos-Bolt"), unsafe_allow_html=True
235
- )
236
- pivot_df, baseline_imputed, leakage_imputed = get_pivot_table(selected_metric)
237
- pivot_df = pivot_df.set_index("Task name")
238
- baseline_imputed = baseline_imputed.set_index("Task name")
239
- leakage_imputed = leakage_imputed.set_index("Task name")
240
-
241
- # Drop columns for models hidden from the leaderboard
242
- hidden_cols = [c for c in pivot_df.columns if c in HIDDEN_MODELS]
243
- pivot_df = pivot_df.drop(columns=hidden_cols)
244
- baseline_imputed = baseline_imputed.drop(columns=hidden_cols)
245
- leakage_imputed = leakage_imputed.drop(columns=hidden_cols)
246
-
247
- # Filter pivot table to only show tasks in the selected group
248
- available_tasks = [t for t in task_list if t in pivot_df.index]
249
- pivot_df = pivot_df.loc[available_tasks]
250
- baseline_imputed = baseline_imputed.loc[available_tasks]
251
- leakage_imputed = leakage_imputed.loc[available_tasks]
252
-
253
- def style_pivot_table(errors, is_baseline_imputed, is_leakage_imputed):
254
- rank_colors = {1: COLORS["gold"], 2: COLORS["silver"], 3: COLORS["bronze"]}
255
-
256
- def highlight_by_position(styler):
257
- for row_idx in errors.index:
258
- row_ranks = errors.loc[row_idx].rank(method="min")
259
- for col_idx in errors.columns:
260
- rank = row_ranks[col_idx]
261
- style_parts = []
262
- if rank <= 3:
263
- style_parts.append(f"background-color: {rank_colors[rank]}")
264
- if is_leakage_imputed.loc[row_idx, col_idx]:
265
- style_parts.append(f"color: {COLORS['leakage_impute']}")
266
- elif is_baseline_imputed.loc[row_idx, col_idx]:
267
- style_parts.append(f"color: {COLORS['failure_impute']}")
268
- elif not style_parts:
269
- style_parts.append(f"color: {COLORS['text_default']}")
270
- if style_parts:
271
- styler = styler.map(
272
- lambda x, s="; ".join(style_parts): s,
273
- subset=pd.IndexSlice[row_idx:row_idx, col_idx:col_idx],
274
- )
275
- return styler
276
-
277
- return highlight_by_position(errors.style).format(precision=3)
278
-
279
- st.dataframe(style_pivot_table(pivot_df, baseline_imputed, leakage_imputed))
280
-
281
- st.divider()
282
- st.markdown("### :material/format_quote: Citation", unsafe_allow_html=True)
283
- st.markdown(CITATION_HEADER)
284
- st.markdown(CITATION_FEV)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
pyproject.toml CHANGED
@@ -1,12 +1,13 @@
1
- [project]
2
- name = "hf-leaderboard"
3
- version = "0.1.0"
4
- requires-python = ">=3.11"
5
- dependencies = [
6
- "altair>=6.0.0",
7
- "fev>=0.7.0",
8
- "numpy<2.2",
9
- "pyarrow<21",
10
- "scipy<1.15",
11
- "streamlit>=1.53.1",
12
- ]
 
 
1
+ [tool.ruff]
2
+ # Enable pycodestyle (`E`) and Pyflakes (`F`) codes by default.
3
+ select = ["E", "F"]
4
+ ignore = ["E501"] # line too long (black is taking care of this)
5
+ line-length = 119
6
+ fixable = ["A", "B", "C", "D", "E", "F", "G", "I", "N", "Q", "S", "T", "W", "ANN", "ARG", "BLE", "COM", "DJ", "DTZ", "EM", "ERA", "EXE", "FBT", "ICN", "INP", "ISC", "NPY", "PD", "PGH", "PIE", "PL", "PT", "PTH", "PYI", "RET", "RSE", "RUF", "SIM", "SLF", "TCH", "TID", "TRY", "UP", "YTT"]
7
+
8
+ [tool.isort]
9
+ profile = "black"
10
+ line_length = 119
11
+
12
+ [tool.black]
13
+ line-length = 119
requirements.txt CHANGED
@@ -1,7 +1,11 @@
 
 
 
 
 
 
 
1
  matplotlib
2
  numpy
3
  pandas
4
- requests
5
- streamlit==1.49.1
6
- fev>=0.6.0
7
- altair>=5.5.0
 
1
+ APScheduler
2
+ black
3
+ datasets
4
+ gradio
5
+ gradio[oauth]
6
+ gradio_client
7
+ huggingface-hub>=0.18.0
8
  matplotlib
9
  numpy
10
  pandas
11
+ fev==0.4.0
 
 
 
save_tables.py DELETED
@@ -1,241 +0,0 @@
1
- #!/usr/bin/env python3
2
-
3
- import argparse
4
- import importlib.util
5
- import io
6
- import sys
7
- from pathlib import Path
8
-
9
- import requests
10
-
11
- sys.path.append(str(Path(__file__).parent))
12
-
13
- import fev
14
- import pandas as pd
15
-
16
- from src.task_groups import ALL_TASKS, DOMAIN_GROUPS, FREQUENCY_GROUPS, MINI_TASKS, TASK_TYPE_GROUPS
17
-
18
- GITHUB_REPO = "autogluon/fev"
19
- RESULTS_PATH = "benchmarks/fev_bench/results"
20
-
21
- # Default location of the local fev clone (sibling of this repo); override with --fev-repo
22
- DEFAULT_FEV_REPO = Path(__file__).resolve().parent.parent / "core"
23
-
24
-
25
- def load_fev_bench_module(fev_repo: Path):
26
- """Load shared compute logic from the fev repo's figure-generation script.
27
-
28
- This keeps the leaderboard and the fev paper-figure script using a single source of truth for
29
- the benchmark config (baseline/leakage models, metrics) and the leaderboard/pairwise compute.
30
- """
31
- script_path = fev_repo / "scripts" / "generate_fev_bench_figures.py"
32
- if not script_path.exists():
33
- raise FileNotFoundError(
34
- f"Could not find the fev figure script at {script_path}. "
35
- "Clone autogluon/fev next to this repo, or pass --fev-repo with your local fev checkout."
36
- )
37
- spec = importlib.util.spec_from_file_location("fev_bench_figures", script_path)
38
- module = importlib.util.module_from_spec(spec)
39
- spec.loader.exec_module(module)
40
- return module
41
-
42
-
43
- # All task groups to generate tables for
44
- TASK_GROUPS = {
45
- "full": ALL_TASKS,
46
- "mini": MINI_TASKS,
47
- "frequency_sub_hourly": FREQUENCY_GROUPS["Sub-hourly"],
48
- "frequency_hourly": FREQUENCY_GROUPS["Hourly"],
49
- "frequency_daily": FREQUENCY_GROUPS["Daily"],
50
- "frequency_weekly": FREQUENCY_GROUPS["Weekly"],
51
- "frequency_monthly_plus": FREQUENCY_GROUPS["Monthly+"],
52
- "domain_energy": DOMAIN_GROUPS["Energy"],
53
- "domain_nature": DOMAIN_GROUPS["Nature"],
54
- "domain_cloud": DOMAIN_GROUPS["Cloud"],
55
- "domain_mobility": DOMAIN_GROUPS["Mobility"],
56
- "domain_econ": DOMAIN_GROUPS["Econ"],
57
- "domain_health": DOMAIN_GROUPS["Health"],
58
- "domain_retail": DOMAIN_GROUPS["Retail"],
59
- "task_type_univariate": TASK_TYPE_GROUPS["Univariate"],
60
- "task_type_covariate_informed": TASK_TYPE_GROUPS["Covariate-informed"],
61
- "task_type_multivariate": TASK_TYPE_GROUPS["Multivariate"],
62
- }
63
-
64
-
65
- def get_csv_files_from_github(commit: str) -> list[str]:
66
- """Get list of CSV file paths from the GitHub repo at a specific commit."""
67
- api_url = f"https://api.github.com/repos/{GITHUB_REPO}/contents/{RESULTS_PATH}?ref={commit}"
68
- response = requests.get(api_url)
69
- response.raise_for_status()
70
-
71
- files = response.json()
72
- csv_files = [f["path"] for f in files if f["name"].endswith(".csv")]
73
-
74
- if not csv_files:
75
- raise FileNotFoundError(f"No CSV files found in {RESULTS_PATH} at commit {commit}")
76
-
77
- return csv_files
78
-
79
-
80
- def load_summaries_from_github(commit: str) -> pd.DataFrame:
81
- """Load and concatenate all CSV summaries from the GitHub repo at a specific commit."""
82
- csv_files = get_csv_files_from_github(commit)
83
- print(f"Found {len(csv_files)} CSV files")
84
-
85
- dfs = []
86
- for file_path in csv_files:
87
- raw_url = f"https://raw.githubusercontent.com/{GITHUB_REPO}/{commit}/{file_path}"
88
- response = requests.get(raw_url)
89
- response.raise_for_status()
90
- df = pd.read_csv(io.StringIO(response.text))
91
- dfs.append(df)
92
- print(f" Loaded: {Path(file_path).name}")
93
-
94
- return pd.concat(dfs, ignore_index=True)
95
-
96
-
97
- def compute_pivot_table(
98
- summaries: pd.DataFrame,
99
- metric_name: str,
100
- baseline_model: str,
101
- leakage_imputation_model: str,
102
- ) -> tuple[pd.DataFrame, pd.DataFrame, pd.DataFrame]:
103
- errors = fev.pivot_table(summaries=summaries, metric_column=metric_name, task_columns=["task_name"])
104
- train_overlap = (
105
- fev.pivot_table(summaries=summaries, metric_column="trained_on_this_dataset", task_columns=["task_name"])
106
- .fillna(False)
107
- .astype(bool)
108
- )
109
-
110
- is_imputed_baseline = errors.isna()
111
- is_leakage_imputed = train_overlap
112
-
113
- # Handle imputations
114
- errors = errors.mask(train_overlap, errors[leakage_imputation_model], axis=0)
115
- for col in errors.columns:
116
- if col != baseline_model:
117
- errors[col] = errors[col].fillna(errors[baseline_model])
118
-
119
- errors = errors[errors.rank(axis=1).mean().sort_values().index]
120
- is_imputed_baseline = is_imputed_baseline[errors.columns]
121
- is_leakage_imputed = is_leakage_imputed[errors.columns]
122
-
123
- errors.index.rename("Task name", inplace=True)
124
- is_imputed_baseline.index.rename("Task name", inplace=True)
125
- is_leakage_imputed.index.rename("Task name", inplace=True)
126
-
127
- return errors.reset_index(), is_imputed_baseline.reset_index(), is_leakage_imputed.reset_index()
128
-
129
-
130
- def load_summaries_from_local(path: Path) -> pd.DataFrame:
131
- """Load and concatenate all CSV summaries from a local directory."""
132
- csv_files = sorted(path.glob("*.csv"))
133
- if not csv_files:
134
- raise FileNotFoundError(f"No CSV files found in {path}")
135
-
136
- print(f"Found {len(csv_files)} CSV files")
137
- dfs = []
138
- for f in csv_files:
139
- df = pd.read_csv(f)
140
- dfs.append(df)
141
- print(f" Loaded: {f.name}")
142
-
143
- return pd.concat(dfs, ignore_index=True)
144
-
145
-
146
- def main():
147
- parser = argparse.ArgumentParser(description="Generate leaderboard tables from CSV summaries in the fev repo")
148
- parser.add_argument(
149
- "commit",
150
- nargs="?",
151
- default="main",
152
- help=f"Git commit SHA or branch name in the {GITHUB_REPO} repository (default: main)",
153
- )
154
- parser.add_argument(
155
- "--local",
156
- type=Path,
157
- help="Path to a local directory containing result CSV files (skips GitHub fetching)",
158
- )
159
- parser.add_argument(
160
- "--fev-repo",
161
- type=Path,
162
- default=DEFAULT_FEV_REPO,
163
- help=f"Path to a local clone of the fev repo, used for shared compute logic (default: {DEFAULT_FEV_REPO})",
164
- )
165
- args = parser.parse_args()
166
-
167
- # Load shared benchmark config + compute layer from the fev repo (single source of truth)
168
- fev_bench = load_fev_bench_module(args.fev_repo)
169
- baseline_model = fev_bench.BASELINE_MODEL
170
- leakage_imputation_model = fev_bench.LEAKAGE_IMPUTATION_MODEL
171
- sort_col = fev_bench.SORT_COL
172
- top_k_models_to_plot = fev_bench.TOP_K_MODELS_TO_PLOT
173
- available_metrics = fev_bench.AVAILABLE_METRICS
174
- compute_leaderboard = fev_bench.compute_leaderboard
175
- compute_pairwise = fev_bench.compute_pairwise
176
-
177
- # Create tables directory
178
- tables_dir = Path("tables")
179
- tables_dir.mkdir(exist_ok=True)
180
-
181
- if args.local:
182
- print(f"Loading summaries from local path: {args.local}")
183
- summaries = load_summaries_from_local(args.local)
184
- else:
185
- print(f"Loading summaries from {GITHUB_REPO} at commit {args.commit}...")
186
- summaries = load_summaries_from_github(args.commit)
187
-
188
- # Save raw summaries for on-the-fly subset computation
189
- summaries.to_csv(tables_dir / "summaries.csv", index=False)
190
- print("Saved: summaries.csv")
191
-
192
- # Generate pivot tables (full version only, at root level)
193
- for metric in available_metrics:
194
- print(f"Processing pivot table for {metric}...")
195
- pivot_df, baseline_imputed, leakage_imputed = compute_pivot_table(
196
- summaries, metric, baseline_model, leakage_imputation_model
197
- )
198
- pivot_df.to_csv(tables_dir / f"pivot_{metric}.csv", index=False)
199
- baseline_imputed.to_csv(tables_dir / f"pivot_{metric}_baseline_imputed.csv", index=False)
200
- leakage_imputed.to_csv(tables_dir / f"pivot_{metric}_leakage_imputed.csv", index=False)
201
- print(f" Saved: pivot_{metric}.csv")
202
-
203
- # Generate leaderboard and pairwise tables for each task group
204
- for group_name, task_list in TASK_GROUPS.items():
205
- print(f"\nProcessing group: {group_name} ({len(task_list)} tasks)...")
206
-
207
- # Create subdirectory for this group
208
- group_dir = tables_dir / group_name
209
- group_dir.mkdir(exist_ok=True)
210
-
211
- # Filter summaries to only include tasks in this group
212
- group_summaries = summaries[summaries["task_name"].isin(task_list)]
213
-
214
- if group_summaries.empty:
215
- print(f" WARNING: No matching tasks found for group {group_name}")
216
- continue
217
-
218
- actual_tasks = group_summaries["task_name"].nunique()
219
- print(f" Found {actual_tasks} tasks in summaries")
220
-
221
- for metric in available_metrics:
222
- # Compute leaderboard for this group
223
- leaderboard_df = compute_leaderboard(group_summaries, metric)
224
- leaderboard_df.to_csv(group_dir / f"leaderboard_{metric}.csv", index=False)
225
-
226
- # Get top models for pairwise comparison
227
- top_k_models = (
228
- leaderboard_df.sort_values(by=sort_col, ascending=False).head(top_k_models_to_plot)["model_name"].tolist()
229
- )
230
-
231
- # Compute pairwise comparison
232
- pairwise_df = compute_pairwise(group_summaries, metric, top_k_models)
233
- pairwise_df.to_csv(group_dir / f"pairwise_{metric}.csv", index=False)
234
-
235
- print(f" Saved: {group_name}/leaderboard_{metric}.csv, {group_name}/pairwise_{metric}.csv")
236
-
237
- print(f"\nAll tables saved to {tables_dir}/")
238
-
239
-
240
- if __name__ == "__main__":
241
- main()
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
src/about.py ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ TITLE = """<h1 align="center" id="space-title">Forecast evaluation leaderboard</h1>"""
2
+
3
+ # What does your leaderboard evaluate?
4
+ INTRODUCTION_TEXT = """
5
+ This space hosts evaluation results for time series forecasting models.
6
+
7
+ The results are obtained using [fev](https://github.com/autogluon/fev) - a lightweight library for evaluating time series forecasting models.
8
+ """
9
+
10
+ ABOUT_LEADERBOARD = """
11
+ ## What is `fev`?
12
+
13
+ [`fev`](https://github.com/autogluon/fev) is a lightweight wrapper around the 🤗 [`datasets`](https://huggingface.co/docs/datasets/en/index) library that makes it easy to benchmark time series forecasting models.
14
+
15
+ For more information about `fev`, please check out [github.com/autogluon/fev](https://github.com/autogluon/fev).
16
+
17
+ Currently, the results in this space are a minimal proof of concept. We plan to add new benchmark datasets and tasks in the future.
18
+
19
+ ## How is `fev` different from other benchmarking tools?
20
+ Existing forecasting benchmarks usually fall into one of two categories:
21
+
22
+ - Standalone datasets without any supporting infrastructure. These provide no guarantees that the results obtained by different users are comparable. For example, changing the start date or duration of the forecast horizon totally changes the meaning of the scores.
23
+ - Bespoke end-to-end systems that combine models, datasets and forecasting tasks. Such packages usually come with lots of dependencies and assumptions, which makes extending or integrating these libraries into existing systems difficult.
24
+
25
+ `fev` aims for the middle ground - it provides the core benchmarking functionality without introducing unnecessary constraints or bloated dependencies. The library supports point & probabilistic forecasting, different types of covariates, as well as all popular forecasting metrics.
26
+
27
+
28
+ ## Submitting your model
29
+ For instructions on how to evaluate your model using `fev` and contribute your results to the leaderboard, please follow the [instructions in the GitHub repo](https://github.com/autogluon/fev/blob/main/docs/04-models.ipynb).
30
+ """
31
+
32
+ CHRONOS_BENCHMARK = """
33
+ ## Chronos Benchmark II results
34
+
35
+ This tab contains results for various forecasting models on the 27 datasets used in Benchmark II in the publication [Chronos: Learning the Language of Time Series](https://arxiv.org/abs/2403.07815).
36
+
37
+ These datasets were used for zero-shot evaluation of Chronos models (i.e., Chronos models were not trained on these datasets), but some other models did include certain datasets in their training corpus.
38
+
39
+ Each table contains the following information:
40
+
41
+ * **Average relative error**: Geometric mean of the relative errors for each task. The relative error for each task is computed as `model_error / baseline_error`.
42
+ * **Average rank**: Arithmetic mean of the ranks achieved by each model on each task.
43
+ * **Median inference time (s)**: Median of the times required to make predictions for the entire dataset (in seconds).
44
+ * **Training corpus overlap (%)**: Percentage of the datasets used in the benchmark that were included in the model's training corpus. Zero-shot models are highlighted in <span style="color:green; font-weight:bold;">green</span>.
45
+
46
+ Lower values are better for all of the above metrics.
47
+
48
+ Task definitions and the detailed results are available on [GitHub](https://github.com/autogluon/fev/tree/main/benchmarks/chronos_zeroshot). More information for the datasets is available in [Table 3 of the paper](https://arxiv.org/abs/2403.07815).
49
+
50
+ """
src/colors.py DELETED
@@ -1,6 +0,0 @@
1
- # Legacy colors - kept for backward compatibility if needed elsewhere
2
- VERY_PALE_PURPLE = "#e8d9f3"
3
- VERY_PALE_GREEN = "#cffdbc"
4
- VERY_PALE_BLUE = "#d6fffe"
5
- DEEP_LAVENDER = "#8d5eb7"
6
- GRASS_GREEN = "#3f9b0b"
 
 
 
 
 
 
 
src/custom_html_js.py ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ custom_css = """
2
+
3
+ .markdown-text {
4
+ font-size: 20px !important;
5
+ }
6
+
7
+ """
8
+
9
+
10
+ # .tab-buttons button {
11
+ # font-size: 20px;
12
+ # }
13
+
14
+ # #citation-button span {
15
+ # font-size: 16px !important;
16
+ # }
17
+
18
+ # #citation-button textarea {
19
+ # font-size: 16px !important;
20
+ # }
21
+
22
+ # #citation-button > label > button {
23
+ # margin: 6px;
24
+ # transform: scale(1.3);
25
+ # }
26
+
27
+
28
+ # #leaderboard-table-lite {
29
+ # margin-top: 15px
30
+ # }
31
+
32
+ # #search-bar-table-box > div:first-child {
33
+ # background: none;
34
+ # border: none;
35
+ # }
36
+
37
+ # #search-bar {
38
+ # padding: 0px;
39
+ # }
40
+
41
+ # /* Hides the final AutoEvalColumn */
42
+ # #llm-benchmark-tab-table table td:last-child,
43
+ # #llm-benchmark-tab-table table th:last-child {
44
+ # display: none;
45
+ # }
46
+
47
+ # /* Limit the width of the first AutoEvalColumn so that names don't expand too much */
48
+ # table td:first-child,
49
+ # table th:first-child {
50
+ # max-width: 400px;
51
+ # overflow: auto;
52
+ # white-space: nowrap;
53
+ # }
54
+
55
+
56
+ # #scale-logo {
57
+ # border-style: none !important;
58
+ # box-shadow: none;
59
+ # display: block;
60
+ # margin-left: auto;
61
+ # margin-right: auto;
62
+ # max-width: 600px;
63
+ # }
64
+
65
+ # #scale-logo .download {
66
+ # display: none;
67
+ # }
68
+ # #filter_type{
69
+ # border: 0;
70
+ # padding-left: 0;
71
+ # padding-top: 0;
72
+ # }
73
+ # #filter_type label {
74
+ # display: flex;
75
+ # }
76
+ # #filter_type label > span{
77
+ # margin-top: var(--spacing-lg);
78
+ # margin-right: 0.5em;
79
+ # }
80
+ # #filter_type label > .wrap{
81
+ # width: 103px;
82
+ # }
83
+ # #filter_type label > .wrap .wrap-inner{
84
+ # padding: 2px;
85
+ # }
86
+ # #filter_type label > .wrap .wrap-inner input{
87
+ # width: 1px
88
+ # }
89
+ # #filter-columns-type{
90
+ # border:0;
91
+ # padding:0.5;
92
+ # }
93
+ # #filter-columns-size{
94
+ # border:0;
95
+ # padding:0.5;
96
+ # }
97
+ # #box-filter > .form{
98
+ # border: 0
99
+ # }
src/formatting.py ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ def model_hyperlink(link, model_name):
2
+ return f'<a target="_blank" href="{link}" style="color: var(--link-text-color); text-decoration: underline;text-decoration-style: dotted;">{model_name}</a>'
3
+
4
+
5
+ MODEL_URLS = {
6
+ "chronos_tiny": "amazon/chronos-t5-tiny",
7
+ "chronos_mini": "amazon/chronos-t5-mini",
8
+ "chronos_small": "amazon/chronos-t5-small",
9
+ "chronos_base": "amazon/chronos-t5-base",
10
+ "chronos_large": "amazon/chronos-t5-large",
11
+ "chronos_bolt_tiny": "amazon/chronos-bolt-tiny",
12
+ "chronos_bolt_mini": "amazon/chronos-bolt-mini",
13
+ "chronos_bolt_small": "amazon/chronos-bolt-small",
14
+ "chronos_bolt_base": "amazon/chronos-bolt-base",
15
+ "moirai_large": "Salesforce/moirai-1.1-R-large",
16
+ "moirai_base": "Salesforce/moirai-1.1-R-base",
17
+ "moirai_small": "Salesforce/moirai-1.1-R-small",
18
+ "timesfm": "google/timesfm-1.0-200m-pytorch",
19
+ "timesfm-2.0": "google/timesfm-2.0-500m-pytorch",
20
+ "ttm-r2": "ibm-granite/granite-timeseries-ttm-r2",
21
+ "tirex": "NX-AI/TiRex",
22
+ }
23
+
24
+
25
+ def make_clickable_model(model_name):
26
+ if model_name in MODEL_URLS:
27
+ model_path = MODEL_URLS.get(model_name)
28
+ link = f"https://huggingface.co/{model_path}"
29
+ return model_hyperlink(link, model_name)
30
+ else:
31
+ return model_name
src/streamlit_app.py DELETED
@@ -1,9 +0,0 @@
1
- import streamlit as st
2
-
3
- pages = [
4
- st.Page("../pages/fev_bench.py", title="fev-bench", icon=":material/trophy:"),
5
- st.Page("../pages/about.py", title="About", icon=":material/info:"),
6
- ]
7
-
8
- page = st.navigation(pages)
9
- page.run()
 
 
 
 
 
 
 
 
 
 
src/strings.py DELETED
@@ -1,114 +0,0 @@
1
- from src.utils import COLORS
2
-
3
- INTRODUCTION_TEXT = """
4
- This space hosts evaluation results for time series forecasting models. The results are obtained using [fev](https://github.com/autogluon/fev) - a lightweight library for evaluating time series forecasting models.
5
- """
6
-
7
- LEGEND = """
8
- """
9
-
10
- TABLE_INFO = f"""
11
- The leaderboard summarizes the performance of all models evaluated on the 100 tasks comprising **fev-bench**. More details available in the [paper](https://arxiv.org/abs/2509.26468).
12
-
13
- Model names are colored by type: <span style='color: {COLORS["pretrained_text"]}; font-weight: bold;'>Pretrained</span>, <span style='color: {COLORS["task_specific_text"]}; font-weight: bold;'>Task-specific</span>, and <span style='color: {COLORS["statistical_text"]}; font-weight: bold;'>Statistical</span>.
14
-
15
- The full matrix $E_{{rj}}$ with the error of each model $j$ on task $r$ is available at the bottom of the page.
16
-
17
- * **Avg. win rate (%)**: Fraction of all possible model pairs and tasks where this model achieves lower error than the competing model. For model $j$, defined as $W_j = \\frac{{1}}{{R(M-1)}} \\sum_{{r=1}}^{{R}} \\sum_{{k \\neq j}} (\\mathbf{{1}}(E_{{rj}} < E_{{rk}}) + 0.5 \\cdot \\mathbf{{1}}(E_{{rj}} = E_{{rk}}))$ where $R$ is number of tasks, $M$ is number of models. Ties count as half-wins.
18
-
19
- Ranges from 0% (worst) to 100% (best). Higher values are better. This value changes as new models are added to the benchmark.
20
-
21
- * **Skill score (%)**: Measures how much the model reduces forecasting error compared to the Seasonal Naive baseline. Computed as $S_j = 100 \\times (1 - \\sqrt[R]{{\\prod_{{r=1}}^{{R}} E_{{rj}}/E_{{r\\beta}}}})$, where $E_{{r\\beta}}$ is baseline error on task $r$. Relative errors are clipped between 0.01 and 100 before aggregation to avoid extreme outliers. Positive values indicate better-than-baseline performance, negative values indicate worse-than-baseline performance.
22
-
23
- Higher values are better. This value does not change as new models are added to the benchmark.
24
-
25
- * **Median runtime (s)**: Median end-to-end time (training + prediction across all evaluation windows) in seconds. Note that inference times depend on hardware, batch sizes, and implementation details, so these serve as a rough guide rather than definitive performance benchmarks.
26
-
27
- * **Leakage (%)**: For zero-shot models, percentage of benchmark datasets included in the model's training corpus. Results for tasks with reported overlap are replaced with Chronos-Bolt (Base) performance to prevent data leakage.
28
-
29
- * **Failed tasks (%)**: Percentage of tasks where the model failed to produce a forecast. Results for failed tasks are replaced with Seasonal Naive performance.
30
-
31
- * **Zero-shot**: Indicates whether the model can make predictions without task-specific training (✓ = zero-shot, × = task-specific).
32
- """
33
-
34
- CHRONOS_BENCHMARK_BASIC_INFO = f"""
35
- **Chronos Benchmark II** contains results for various forecasting models on the 27 datasets used in Benchmark II in the paper [Chronos: Learning the Language of Time Series](https://arxiv.org/abs/2403.07815). {LEGEND}
36
- """
37
-
38
- CHRONOS_BENCHMARK_DETAILS = f"""
39
- {TABLE_INFO}
40
-
41
- Task definitions and the detailed results are available on [GitHub](https://github.com/autogluon/fev/tree/main/benchmarks/chronos_zeroshot). More information for the datasets is available in [Table 3 of the paper](https://arxiv.org/abs/2403.07815).
42
- """
43
-
44
- FEV_BENCHMARK_BASIC_INFO = f"""
45
- Results for various forecasting models on 100 tasks of the **fev-bench** benchmark, as described in [fev-bench: A Realistic Benchmark for Time Series Forecasting](https://arxiv.org/abs/2509.26468). {LEGEND}
46
- """
47
-
48
- FEV_BENCHMARK_DETAILS = f"""
49
- {TABLE_INFO}
50
-
51
- Task definitions and the detailed results are available on [GitHub](https://github.com/autogluon/fev/tree/main/benchmarks/fev_bench/). For model wrappers, see [`models/`](https://github.com/autogluon/fev/tree/main/models). Datasets used for evaluation are available on [Hugging Face](https://huggingface.co/datasets/autogluon/fev_datasets).
52
- """
53
-
54
- CITATION_HEADER = """
55
- If you find this leaderboard useful for your research, please consider citing the associated paper(s):
56
-
57
- """
58
- CITATION_FEV = """
59
- ```
60
- @article{shchur2025fev,
61
- title={{fev-bench}: A Realistic Benchmark for Time Series Forecasting},
62
- author={Shchur, Oleksandr and Ansari, Abdul Fatir and Turkmen, Caner and Stella, Lorenzo and Erickson, Nick and Guerron, Pablo and Bohlke-Schneider, Michael and Wang, Yuyang},
63
- year={2025},
64
- eprint={2509.26468},
65
- archivePrefix={arXiv},
66
- primaryClass={cs.LG}
67
- }
68
- ```
69
- """
70
-
71
-
72
- def get_pivot_legend(baseline_model: str, leakage_imputation_model: str) -> str:
73
- return f"""
74
- Task definitions and raw results in CSV format are available on [GitHub](https://github.com/autogluon/fev/tree/main/benchmarks/fev_bench).
75
-
76
- Best results for each task are marked with
77
- <span style='background: {COLORS["gold"]}; color: {COLORS["text_default"]}; padding: 3px; border-radius: 5px;'>🥇 1st</span>
78
- <span style='background: {COLORS["silver"]}; color: {COLORS["text_default"]}; padding: 3px; border-radius: 5px;'>🥈 2nd</span>
79
- <span style='background: {COLORS["bronze"]}; color: {COLORS["text_default"]}; padding: 3px; border-radius: 5px;'>🥉 3rd</span>
80
- <br><br>
81
- **Imputation:**
82
- - <span style='color: {COLORS["failure_impute"]}; font-weight: bold;'>Failed tasks</span> imputed by {baseline_model}
83
- - <span style='color: {COLORS["leakage_impute"]}; font-weight: bold;'>Leaky tasks</span> imputed by {leakage_imputation_model}
84
- """
85
-
86
-
87
- PAIRWISE_BENCHMARK_DETAILS = """
88
- The pairwise charts show head-to-head results between models:
89
-
90
- * **Win rate**: Percentage of tasks where Model 1 achieves lower error than Model 2 (ties count as half-wins).
91
- A value above 50% means Model 1 is more accurate than Model 2 on average.
92
-
93
- * **Skill score**: Average relative error reduction of Model 1 with respect to Model 2.
94
- A positive value means Model 1 reduces forecasting error compared to Model 2 on average.
95
-
96
- **Confidence Intervals**: 95% intervals are estimated using 1000 bootstrap samples over tasks.
97
- For each bootstrap sample, tasks are resampled with replacement and the pairwise win rate / skill score are recomputed.
98
- The intervals correspond to the 2.5th and 97.5th percentiles of these bootstrap distributions,
99
- capturing how model comparisons vary under alternative benchmark compositions.
100
- """
101
-
102
-
103
- CITATION_CHRONOS = """
104
- ```
105
- @article{ansari2024chronos,
106
- title={Chronos: Learning the Language of Time Series},
107
- author={Ansari, Abdul Fatir and Stella, Lorenzo and Turkmen, Caner and Zhang, Xiyuan, and Mercado, Pedro and Shen, Huibin and Shchur, Oleksandr and Rangapuram, Syama Syndar and Pineda Arango, Sebastian and Kapoor, Shubham and Zschiegner, Jasper and Maddix, Danielle C. and Wang, Hao and Mahoney, Michael W. and Torkkola, Kari and Gordon Wilson, Andrew and Bohlke-Schneider, Michael and Wang, Yuyang},
108
- journal={Transactions on Machine Learning Research},
109
- issn={2835-8856},
110
- year={2024},
111
- url={https://openreview.net/forum?id=gerNCVqqtR}
112
- }
113
- ```
114
- """
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
src/task_groups.py DELETED
@@ -1,266 +0,0 @@
1
- """Task groupings for filtering the leaderboard by subsets."""
2
-
3
- # All tasks in the benchmark (100 tasks)
4
- ALL_TASKS = [
5
- "ETT_15T", "ETT_1D", "ETT_1H", "ETT_1W",
6
- "LOOP_SEATTLE_1D", "LOOP_SEATTLE_1H", "LOOP_SEATTLE_5T",
7
- "M_DENSE_1D", "M_DENSE_1H",
8
- "SZ_TAXI_15T", "SZ_TAXI_1H",
9
- "australian_tourism",
10
- "bizitobs_l2c_1H", "bizitobs_l2c_5T",
11
- "boomlet_1062", "boomlet_1209", "boomlet_1225", "boomlet_1230", "boomlet_1282",
12
- "boomlet_1487", "boomlet_1631", "boomlet_1676", "boomlet_1855", "boomlet_1975",
13
- "boomlet_2187", "boomlet_285", "boomlet_619", "boomlet_772", "boomlet_963",
14
- "ecdc_ili",
15
- "entsoe_15T", "entsoe_1H", "entsoe_30T",
16
- "epf_be", "epf_de", "epf_fr", "epf_np", "epf_pjm",
17
- "ercot_1D", "ercot_1H", "ercot_1M", "ercot_1W",
18
- "favorita_stores_1D", "favorita_stores_1M", "favorita_stores_1W",
19
- "favorita_transactions_1D", "favorita_transactions_1M", "favorita_transactions_1W",
20
- "fred_md_2025/cee", "fred_md_2025/macro",
21
- "fred_qd_2025/cee", "fred_qd_2025/macro",
22
- "gvar",
23
- "hermes",
24
- "hierarchical_sales_1D", "hierarchical_sales_1W",
25
- "hospital", "hospital_admissions_1D", "hospital_admissions_1W",
26
- "jena_weather_10T", "jena_weather_1D", "jena_weather_1H",
27
- "kdd_cup_2022_10T", "kdd_cup_2022_1D", "kdd_cup_2022_30T",
28
- "m5_1D", "m5_1M", "m5_1W",
29
- "proenfo_gfc12", "proenfo_gfc14", "proenfo_gfc17",
30
- "redset_15T", "redset_1H", "redset_5T",
31
- "restaurant",
32
- "rohlik_orders_1D", "rohlik_orders_1W", "rohlik_sales_1D", "rohlik_sales_1W",
33
- "rossmann_1D", "rossmann_1W",
34
- "solar_1D", "solar_1W", "solar_with_weather_15T", "solar_with_weather_1H",
35
- "uci_air_quality_1D", "uci_air_quality_1H",
36
- "uk_covid_nation_1D/cumulative", "uk_covid_nation_1D/new",
37
- "uk_covid_nation_1W/cumulative", "uk_covid_nation_1W/new",
38
- "uk_covid_utla_1D/new", "uk_covid_utla_1W/cumulative",
39
- "us_consumption_1M", "us_consumption_1Q", "us_consumption_1Y",
40
- "walmart",
41
- "world_co2_emissions", "world_life_expectancy", "world_tourism",
42
- ]
43
-
44
- # Mini benchmark - representative subset (20 tasks)
45
- MINI_TASKS = [
46
- "jena_weather_1H",
47
- "M_DENSE_1D",
48
- "bizitobs_l2c_5T",
49
- "rohlik_orders_1D",
50
- "boomlet_1282",
51
- "rossmann_1D",
52
- "rossmann_1W",
53
- "boomlet_1676",
54
- "solar_with_weather_1H",
55
- "boomlet_619",
56
- "uci_air_quality_1H",
57
- "uk_covid_nation_1D/cumulative",
58
- "us_consumption_1Y",
59
- "epf_np",
60
- "world_co2_emissions",
61
- "ETT_15T",
62
- "ETT_1H",
63
- "proenfo_gfc14",
64
- "hospital_admissions_1D",
65
- "hospital_admissions_1W",
66
- ]
67
-
68
- # Frequency-based groupings
69
- FREQUENCY_GROUPS = {
70
- "Sub-hourly": [
71
- # T (1 minute)
72
- "boomlet_1225", "boomlet_1282", "boomlet_285", "boomlet_619", "boomlet_772", "boomlet_963",
73
- # 5T (5 minutes)
74
- "LOOP_SEATTLE_5T", "bizitobs_l2c_5T", "redset_5T",
75
- "boomlet_1062", "boomlet_1209", "boomlet_1230", "boomlet_1487",
76
- # 10T (10 minutes)
77
- "jena_weather_10T", "kdd_cup_2022_10T",
78
- # 15T (15 minutes)
79
- "ETT_15T", "SZ_TAXI_15T", "entsoe_15T", "redset_15T", "solar_with_weather_15T",
80
- # 30T (30 minutes)
81
- "entsoe_30T", "kdd_cup_2022_30T", "boomlet_1631", "boomlet_1676",
82
- ],
83
- "Hourly": [
84
- "ETT_1H", "LOOP_SEATTLE_1H", "M_DENSE_1H", "SZ_TAXI_1H",
85
- "bizitobs_l2c_1H", "entsoe_1H", "ercot_1H",
86
- "epf_be", "epf_de", "epf_fr", "epf_np", "epf_pjm",
87
- "jena_weather_1H",
88
- "proenfo_gfc12", "proenfo_gfc14", "proenfo_gfc17",
89
- "redset_1H", "solar_with_weather_1H", "uci_air_quality_1H",
90
- "boomlet_1855", "boomlet_1975", "boomlet_2187",
91
- ],
92
- "Daily": [
93
- "ETT_1D", "LOOP_SEATTLE_1D", "M_DENSE_1D",
94
- "ercot_1D", "kdd_cup_2022_1D", "solar_1D",
95
- "favorita_stores_1D", "favorita_transactions_1D",
96
- "hierarchical_sales_1D", "m5_1D",
97
- "restaurant",
98
- "rohlik_orders_1D", "rohlik_sales_1D", "rossmann_1D",
99
- "jena_weather_1D", "uci_air_quality_1D",
100
- "hospital_admissions_1D",
101
- "uk_covid_nation_1D/cumulative", "uk_covid_nation_1D/new", "uk_covid_utla_1D/new",
102
- ],
103
- "Weekly": [
104
- "ETT_1W", "ercot_1W", "solar_1W",
105
- "favorita_stores_1W", "favorita_transactions_1W",
106
- "hierarchical_sales_1W", "m5_1W",
107
- "hermes", "walmart",
108
- "rohlik_orders_1W", "rohlik_sales_1W", "rossmann_1W",
109
- "ecdc_ili",
110
- "hospital_admissions_1W",
111
- "uk_covid_nation_1W/cumulative", "uk_covid_nation_1W/new", "uk_covid_utla_1W/cumulative",
112
- ],
113
- "Monthly+": [
114
- # Monthly
115
- "ercot_1M",
116
- "favorita_stores_1M", "favorita_transactions_1M", "m5_1M",
117
- "fred_md_2025/cee", "fred_md_2025/macro",
118
- "hospital",
119
- "us_consumption_1M",
120
- # Quarterly
121
- "australian_tourism", "gvar",
122
- "fred_qd_2025/cee", "fred_qd_2025/macro",
123
- "us_consumption_1Q",
124
- # Yearly
125
- "us_consumption_1Y",
126
- "world_co2_emissions", "world_life_expectancy", "world_tourism",
127
- ],
128
- }
129
-
130
- # Domain-based groupings
131
- DOMAIN_GROUPS = {
132
- "Energy": [
133
- "ETT_15T", "ETT_1D", "ETT_1H", "ETT_1W",
134
- "entsoe_15T", "entsoe_1H", "entsoe_30T",
135
- "epf_be", "epf_de", "epf_fr", "epf_np", "epf_pjm",
136
- "ercot_1D", "ercot_1H", "ercot_1M", "ercot_1W",
137
- "kdd_cup_2022_10T", "kdd_cup_2022_1D", "kdd_cup_2022_30T",
138
- "proenfo_gfc12", "proenfo_gfc14", "proenfo_gfc17",
139
- "solar_1D", "solar_1W", "solar_with_weather_15T", "solar_with_weather_1H",
140
- ],
141
- "Retail": [
142
- "favorita_stores_1D", "favorita_stores_1M", "favorita_stores_1W",
143
- "favorita_transactions_1D", "favorita_transactions_1M", "favorita_transactions_1W",
144
- "hermes",
145
- "hierarchical_sales_1D", "hierarchical_sales_1W",
146
- "m5_1D", "m5_1M", "m5_1W",
147
- "restaurant",
148
- "rohlik_orders_1D", "rohlik_orders_1W", "rohlik_sales_1D", "rohlik_sales_1W",
149
- "rossmann_1D", "rossmann_1W",
150
- "walmart",
151
- ],
152
- "Nature": [
153
- "jena_weather_10T", "jena_weather_1D", "jena_weather_1H",
154
- "uci_air_quality_1D", "uci_air_quality_1H",
155
- ],
156
- "Cloud": [
157
- "bizitobs_l2c_1H", "bizitobs_l2c_5T",
158
- "boomlet_1062", "boomlet_1209", "boomlet_1225", "boomlet_1230", "boomlet_1282",
159
- "boomlet_1487", "boomlet_1631", "boomlet_1676", "boomlet_1855", "boomlet_1975",
160
- "boomlet_2187", "boomlet_285", "boomlet_619", "boomlet_772", "boomlet_963",
161
- "redset_15T", "redset_1H", "redset_5T",
162
- ],
163
- "Health": [
164
- "ecdc_ili",
165
- "hospital", "hospital_admissions_1D", "hospital_admissions_1W",
166
- "uk_covid_nation_1D/cumulative", "uk_covid_nation_1D/new",
167
- "uk_covid_nation_1W/cumulative", "uk_covid_nation_1W/new",
168
- "uk_covid_utla_1D/new", "uk_covid_utla_1W/cumulative",
169
- ],
170
- "Econ": [
171
- "australian_tourism",
172
- "fred_md_2025/cee", "fred_md_2025/macro",
173
- "fred_qd_2025/cee", "fred_qd_2025/macro",
174
- "gvar",
175
- "us_consumption_1M", "us_consumption_1Q", "us_consumption_1Y",
176
- "world_co2_emissions", "world_life_expectancy", "world_tourism",
177
- ],
178
- "Mobility": [
179
- "LOOP_SEATTLE_1D", "LOOP_SEATTLE_1H", "LOOP_SEATTLE_5T",
180
- "M_DENSE_1D", "M_DENSE_1H",
181
- "SZ_TAXI_15T", "SZ_TAXI_1H",
182
- ],
183
- }
184
- # Task type groupings (overlapping: a multivariate task with covariates
185
- # belongs to both "Covariate-informed" and "Multivariate").
186
- # - Multivariate: target is a list of columns
187
- # - Covariate-informed: known_dynamic_columns or past_dynamic_columns is non-empty
188
- # - Univariate: neither of the above
189
- TASK_TYPE_GROUPS = {
190
- "Univariate": [
191
- "LOOP_SEATTLE_1D", "LOOP_SEATTLE_1H", "LOOP_SEATTLE_5T",
192
- "M_DENSE_1D", "M_DENSE_1H",
193
- "SZ_TAXI_15T", "SZ_TAXI_1H",
194
- "australian_tourism", "ecdc_ili",
195
- "ercot_1D", "ercot_1H", "ercot_1M", "ercot_1W",
196
- "hierarchical_sales_1D", "hierarchical_sales_1W",
197
- "hospital", "hospital_admissions_1D", "hospital_admissions_1W",
198
- "redset_15T", "redset_1H", "redset_5T",
199
- "restaurant",
200
- "solar_1D", "solar_1W",
201
- "uk_covid_utla_1D/new", "uk_covid_utla_1W/cumulative",
202
- "us_consumption_1M", "us_consumption_1Q", "us_consumption_1Y",
203
- "world_co2_emissions", "world_life_expectancy", "world_tourism",
204
- ],
205
- "Covariate-informed": [
206
- "entsoe_15T", "entsoe_1H", "entsoe_30T",
207
- "epf_be", "epf_de", "epf_fr", "epf_np", "epf_pjm",
208
- "favorita_stores_1D", "favorita_stores_1M", "favorita_stores_1W",
209
- "favorita_transactions_1D", "favorita_transactions_1M", "favorita_transactions_1W",
210
- "fred_md_2025/cee", "fred_qd_2025/cee",
211
- "gvar", "hermes",
212
- "kdd_cup_2022_10T", "kdd_cup_2022_1D", "kdd_cup_2022_30T",
213
- "m5_1D", "m5_1M", "m5_1W",
214
- "proenfo_gfc12", "proenfo_gfc14", "proenfo_gfc17",
215
- "rohlik_orders_1D", "rohlik_orders_1W", "rohlik_sales_1D", "rohlik_sales_1W",
216
- "rossmann_1D", "rossmann_1W",
217
- "solar_with_weather_15T", "solar_with_weather_1H",
218
- "uci_air_quality_1D", "uci_air_quality_1H",
219
- "uk_covid_nation_1D/cumulative", "uk_covid_nation_1D/new",
220
- "uk_covid_nation_1W/cumulative", "uk_covid_nation_1W/new",
221
- "walmart",
222
- ],
223
- "Multivariate": [
224
- "ETT_15T", "ETT_1D", "ETT_1H", "ETT_1W",
225
- "bizitobs_l2c_1H", "bizitobs_l2c_5T",
226
- "boomlet_1062", "boomlet_1209", "boomlet_1225", "boomlet_1230", "boomlet_1282",
227
- "boomlet_1487", "boomlet_1631", "boomlet_1676", "boomlet_1855", "boomlet_1975",
228
- "boomlet_2187", "boomlet_285", "boomlet_619", "boomlet_772", "boomlet_963",
229
- "fred_md_2025/cee", "fred_md_2025/macro", "fred_qd_2025/cee", "fred_qd_2025/macro",
230
- "gvar",
231
- "jena_weather_10T", "jena_weather_1D", "jena_weather_1H",
232
- "uci_air_quality_1D", "uci_air_quality_1H",
233
- "uk_covid_nation_1D/cumulative", "uk_covid_nation_1D/new",
234
- "uk_covid_nation_1W/cumulative", "uk_covid_nation_1W/new",
235
- ],
236
- }
237
-
238
-
239
- def get_task_group(group_type: str, group_value: str | None = None) -> list[str]:
240
- """Get the list of tasks for a given group type and value.
241
-
242
- Args:
243
- group_type: One of "full", "mini", "frequency", "domain", "task_type"
244
- group_value: Required for "frequency", "domain", and "task_type" types
245
-
246
- Returns:
247
- List of task names belonging to the group
248
- """
249
- if group_type == "full":
250
- return ALL_TASKS
251
- elif group_type == "mini":
252
- return MINI_TASKS
253
- elif group_type == "frequency":
254
- if group_value is None:
255
- raise ValueError("group_value required for frequency grouping")
256
- return FREQUENCY_GROUPS[group_value]
257
- elif group_type == "domain":
258
- if group_value is None:
259
- raise ValueError("group_value required for domain grouping")
260
- return DOMAIN_GROUPS[group_value]
261
- elif group_type == "task_type":
262
- if group_value is None:
263
- raise ValueError("group_value required for task_type grouping")
264
- return TASK_TYPE_GROUPS[group_value]
265
- else:
266
- raise ValueError(f"Unknown group_type: {group_type}")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
src/utils.py DELETED
@@ -1,413 +0,0 @@
1
- import altair as alt
2
- import fev
3
- import pandas as pd
4
- import pandas.io.formats.style
5
-
6
- # Color constants - all colors defined in one place
7
-
8
- COLORS = {
9
- "pretrained_text": "#5A7FA5",
10
- "task_specific_text": "#7B5A9A",
11
- "statistical_text": "#A5795A",
12
- "bar_fill": "#8d5eb7",
13
- "error_bar": "#222222",
14
- "point": "#111111",
15
- "text_white": "white",
16
- "text_black": "black",
17
- "text_default": "#111",
18
- "gold": "#F7D36B",
19
- "silver": "#E5E7EB",
20
- "bronze": "#E6B089",
21
- "leakage_impute": "#3B82A0",
22
- "failure_impute": "#E07B39",
23
- }
24
- HEATMAP_COLOR_SCHEME = "purplegreen"
25
-
26
- # Model configuration: (url, org, zero_shot, model_type)
27
- MODEL_CONFIG = {
28
- # Chronos Models
29
- "chronos_tiny": ("amazon/chronos-t5-tiny", "AWS", True, "pretrained"),
30
- "chronos_mini": ("amazon/chronos-t5-mini", "AWS", True, "pretrained"),
31
- "chronos_small": ("amazon/chronos-t5-small", "AWS", True, "pretrained"),
32
- "chronos_base": ("amazon/chronos-t5-base", "AWS", True, "pretrained"),
33
- "chronos_large": ("amazon/chronos-t5-large", "AWS", True, "pretrained"),
34
- "chronos_bolt_tiny": ("amazon/chronos-bolt-tiny", "AWS", True, "pretrained"),
35
- "chronos_bolt_mini": ("amazon/chronos-bolt-mini", "AWS", True, "pretrained"),
36
- "chronos_bolt_small": ("amazon/chronos-bolt-small", "AWS", True, "pretrained"),
37
- "chronos_bolt_base": ("amazon/chronos-bolt-base", "AWS", True, "pretrained"),
38
- "chronos-bolt": ("amazon/chronos-bolt-base", "AWS", True, "pretrained"),
39
- "chronos-2": ("amazon/chronos-2", "AWS", True, "pretrained"),
40
- # Moirai Models
41
- "moirai_large": ("Salesforce/moirai-1.1-R-large", "Salesforce", True, "pretrained"),
42
- "moirai_base": ("Salesforce/moirai-1.1-R-base", "Salesforce", True, "pretrained"),
43
- "moirai_small": ("Salesforce/moirai-1.1-R-small", "Salesforce", True, "pretrained"),
44
- "moirai-2.0": ("Salesforce/moirai-2.0-R-small", "Salesforce", True, "pretrained"),
45
- # TimesFM Models
46
- "timesfm": ("google/timesfm-1.0-200m-pytorch", "Google", True, "pretrained"),
47
- "timesfm-2.0": ("google/timesfm-2.0-500m-pytorch", "Google", True, "pretrained"),
48
- "timesfm-2.5": ("google/timesfm-2.5-200m-pytorch", "Google", True, "pretrained"),
49
- # Toto Models
50
- "toto-1.0": ("Datadog/Toto-Open-Base-1.0", "Datadog", True, "pretrained"),
51
- "toto-2.0-2.5b": ("Datadog/Toto-2.0-2.5B", "Datadog", True, "pretrained"),
52
- "toto-2.0-22m": ("Datadog/Toto-2.0-22m", "Datadog", True, "pretrained"),
53
- # Other Models
54
- "tirex": ("NX-AI/TiRex", "NX-AI", True, "pretrained"),
55
- "tirex-2": ("NX-AI/TiRex-2-fevbench", "NX-AI", True, "pretrained"),
56
- "tabpfn-ts": ("Prior-Labs/TabPFN-v2-reg", "Prior Labs", True, "pretrained"),
57
- "tabpfn-ts-3": ("Prior-Labs/TabPFN-2.5-reg", "Prior Labs", True, "pretrained"),
58
- "sundial-base": ("thuml/sundial-base-128m", "Tsinghua University", True, "pretrained"),
59
- "ttm-r2": ("ibm-granite/granite-timeseries-ttm-r2", "IBM", True, "pretrained"),
60
- "flowstate": ("ibm-granite/granite-timeseries-flowstate-r1", "IBM", True, "pretrained"),
61
- # GluonTS Models
62
- "deepar": ("https://github.com/awslabs/gluonts", "—", False, "task-specific"),
63
- "tft": ("https://github.com/awslabs/gluonts", "—", False, "task-specific"),
64
- "patchtst": ("https://github.com/awslabs/gluonts", "—", False, "task-specific"),
65
- # MLForecast Models
66
- "lightgbm": ("https://nixtlaverse.nixtla.io/mlforecast", "—", False, "task-specific"),
67
- "catboost": ("https://nixtlaverse.nixtla.io/mlforecast", "—", False, "task-specific"),
68
- # Statistical models
69
- "stat. ensemble": (
70
- "https://nixtlaverse.nixtla.io/statsforecast/",
71
- "—",
72
- False,
73
- "statistical",
74
- ),
75
- "autoarima": ("https://nixtlaverse.nixtla.io/statsforecast/", "—", False, "statistical"),
76
- "autotheta": ("https://nixtlaverse.nixtla.io/statsforecast/", "—", False, "statistical"),
77
- "autoets": ("https://nixtlaverse.nixtla.io/statsforecast/", "—", False, "statistical"),
78
- "seasonalnaive": ("https://nixtlaverse.nixtla.io/statsforecast/", "—", False, "statistical"),
79
- "seasonal naive": (
80
- "https://nixtlaverse.nixtla.io/statsforecast/",
81
- "—",
82
- False,
83
- "statistical",
84
- ),
85
- "drift": ("https://nixtlaverse.nixtla.io/statsforecast/", "—", False, "statistical"),
86
- "naive": ("https://nixtlaverse.nixtla.io/statsforecast/", "—", False, "statistical"),
87
- }
88
-
89
-
90
- ALL_METRICS = {
91
- "SQL": (
92
- "SQL: Scaled Quantile Loss",
93
- "The [Scaled Quantile Loss (SQL)](https://auto.gluon.ai/dev/tutorials/timeseries/forecasting-metrics.html#autogluon.timeseries.metrics.SQL) is a **scale-invariant** metric for evaluating **probabilistic** forecasts.",
94
- ),
95
- "MASE": (
96
- "MASE: Mean Absolute Scaled Error",
97
- "The [Mean Absolute Scaled Error (MASE)](https://auto.gluon.ai/dev/tutorials/timeseries/forecasting-metrics.html#autogluon.timeseries.metrics.MASE) is a **scale-invariant** metric for evaluating **point** forecasts.",
98
- ),
99
- "WQL": (
100
- "WQL: Weighted Quantile Loss",
101
- "The [Weighted Quantile Loss (WQL)](https://auto.gluon.ai/dev/tutorials/timeseries/forecasting-metrics.html#autogluon.timeseries.metrics.WQL), is a **scale-dependent** metric for evaluating **probabilistic** forecasts.",
102
- ),
103
- "WAPE": (
104
- "WAPE: Weighted Absolute Percentage Error",
105
- "The [Weighted Absolute Percentage Error (WAPE)](https://auto.gluon.ai/dev/tutorials/timeseries/forecasting-metrics.html#autogluon.timeseries.metrics.WAPE) is a **scale-dependent** metric for evaluating **point** forecasts.",
106
- ),
107
- }
108
-
109
-
110
- def format_metric_name(metric_name: str):
111
- return ALL_METRICS[metric_name][0]
112
-
113
-
114
- def get_metric_description(metric_name: str):
115
- return ALL_METRICS[metric_name][1]
116
-
117
-
118
- # Models excluded from the leaderboard display (redundant Toto-2.0 sizes; keep 2.5B and 22m)
119
- HIDDEN_MODELS = ["Toto-2.0-1B", "Toto-2.0-313m", "Toto-2.0-4m"]
120
-
121
-
122
- def filter_hidden_models(df: pd.DataFrame, model_column: str = "model_name") -> pd.DataFrame:
123
- """Drop rows for models in HIDDEN_MODELS based on the given model-name column."""
124
- return df[~df[model_column].isin(HIDDEN_MODELS)]
125
-
126
-
127
- def validate_model_metadata(model_names) -> None:
128
- """Raise if any displayed model lacks a MODEL_CONFIG entry (organization, link, type, etc.)."""
129
- missing = sorted({m for m in model_names if MODEL_CONFIG.get(m.lower()) is None})
130
- if missing:
131
- raise ValueError(
132
- f"Missing MODEL_CONFIG metadata (organization, link, type) for models: {missing}. "
133
- "Add entries to MODEL_CONFIG in src/utils.py."
134
- )
135
-
136
-
137
- def get_model_link(model_name):
138
- config = MODEL_CONFIG.get(model_name.lower())
139
- if not config or not config[0]:
140
- return ""
141
- url = config[0]
142
- return url if url.startswith("https:") else f"https://huggingface.co/{url}"
143
-
144
-
145
- def get_model_organization(model_name):
146
- config = MODEL_CONFIG.get(model_name.lower())
147
- return config[1] if config else "—"
148
-
149
-
150
- def get_zero_shot_status(model_name):
151
- config = MODEL_CONFIG.get(model_name.lower())
152
- return "✓" if config and config[2] else "×"
153
-
154
-
155
- def get_model_type(model_name):
156
- config = MODEL_CONFIG.get(model_name.lower())
157
- return config[3] if config else "—"
158
-
159
-
160
- MODEL_TYPE_COLORS = {
161
- "pretrained": "pretrained_text",
162
- "task-specific": "task_specific_text",
163
- "statistical": "statistical_text",
164
- }
165
-
166
-
167
- def highlight_model_type_color(cell):
168
- config = MODEL_CONFIG.get(cell.lower())
169
- if config:
170
- color_key = MODEL_TYPE_COLORS.get(config[3], "text_default")
171
- return f"font-weight: bold; color: {COLORS[color_key]}"
172
- return "font-weight: bold"
173
-
174
-
175
- def format_leaderboard(df: pd.DataFrame):
176
- df = df.copy()
177
- df["skill_score"] = df["skill_score"].round(1)
178
- df["win_rate"] = df["win_rate"].round(1)
179
- df["zero_shot"] = df["model_name"].apply(get_zero_shot_status)
180
- # Format leakage column: convert to int for all models, 0 for non-zero-shot
181
- df["training_corpus_overlap"] = df.apply(
182
- lambda row: int(round(row["training_corpus_overlap"] * 100)) if row["zero_shot"] == "✓" else 0,
183
- axis=1,
184
- )
185
- df["link"] = df["model_name"].apply(get_model_link)
186
- df["org"] = df["model_name"].apply(get_model_organization)
187
- df = df[
188
- [
189
- "model_name",
190
- "win_rate",
191
- "skill_score",
192
- "median_inference_time_s_per100",
193
- "training_corpus_overlap",
194
- "num_failures",
195
- "zero_shot",
196
- "org",
197
- "link",
198
- ]
199
- ]
200
- return (
201
- df.style.map(highlight_model_type_color, subset=["model_name"])
202
- .map(lambda x: "font-weight: bold", subset=["zero_shot"])
203
- .apply(
204
- lambda x: ["background-color: #f8f9fa" if i % 2 == 1 else "" for i in range(len(x))],
205
- axis=0,
206
- )
207
- )
208
-
209
-
210
- def construct_bar_chart(df: pd.DataFrame, col: str, metric_name: str):
211
- label = "Skill Score" if col == "skill_score" else "Win Rate"
212
-
213
- tooltip = [
214
- alt.Tooltip("model_name:N"),
215
- alt.Tooltip(f"{col}:Q", format=".2f"),
216
- alt.Tooltip(f"{col}_lower:Q", title="95% CI Lower", format=".2f"),
217
- alt.Tooltip(f"{col}_upper:Q", title="95% CI Upper", format=".2f"),
218
- ]
219
-
220
- base_encode = {
221
- "y": alt.Y("model_name:N", title="Forecasting Model", sort=None),
222
- "tooltip": tooltip,
223
- }
224
-
225
- bars = (
226
- alt.Chart(df)
227
- .mark_bar(color=COLORS["bar_fill"], cornerRadius=4)
228
- .encode(
229
- x=alt.X(f"{col}:Q", title=f"{label} (%)", scale=alt.Scale(zero=False)),
230
- **base_encode,
231
- )
232
- )
233
-
234
- error_bars = (
235
- alt.Chart(df)
236
- .mark_errorbar(ticks={"height": 5}, color=COLORS["error_bar"])
237
- .encode(
238
- y=alt.Y("model_name:N", title=None, sort=None),
239
- x=alt.X(f"{col}_lower:Q", title=f"{label} (%)"),
240
- x2=alt.X2(f"{col}_upper:Q"),
241
- tooltip=tooltip,
242
- )
243
- )
244
-
245
- points = (
246
- alt.Chart(df)
247
- .mark_point(filled=True, color=COLORS["point"])
248
- .encode(x=alt.X(f"{col}:Q", title=f"{label} (%)"), **base_encode)
249
- )
250
-
251
- return (
252
- (bars + error_bars + points)
253
- .properties(height=500, title=f"{label} ({metric_name}) with 95% CIs")
254
- .configure_title(fontSize=16)
255
- )
256
-
257
-
258
- def construct_pairwise_chart(df: pd.DataFrame, col: str, metric_name: str):
259
- # Color ranges kept in sync with the fev repo's generate_fev_bench_figures.py
260
- config = {
261
- "win_rate": ("Win Rate", [0, 100], 50, f"abs(datum.{col} - 50) > 30"),
262
- "skill_score": ("Skill Score", [-30, 30], 0, f"abs(datum.{col}) > 20"),
263
- }
264
- cbar_label, domain, domain_mid, text_condition = config[col]
265
-
266
- df = df.copy()
267
- for c in [col, f"{col}_lower", f"{col}_upper"]:
268
- df[c] *= 100
269
-
270
- model_order = df.groupby("model_1")[col].mean().sort_values(ascending=False).index.tolist()
271
-
272
- tooltip = [
273
- alt.Tooltip("model_1:N", title="Model 1"),
274
- alt.Tooltip("model_2:N", title="Model 2"),
275
- alt.Tooltip(f"{col}:Q", title=cbar_label.split(" ")[0], format=".1f"),
276
- alt.Tooltip(f"{col}_lower:Q", title="95% CI Lower", format=".1f"),
277
- alt.Tooltip(f"{col}_upper:Q", title="95% CI Upper", format=".1f"),
278
- ]
279
-
280
- base = alt.Chart(df).encode(
281
- x=alt.X(
282
- "model_2:N",
283
- sort=model_order,
284
- title="Model 2",
285
- axis=alt.Axis(orient="top", labelAngle=-90),
286
- ),
287
- y=alt.Y("model_1:N", sort=model_order, title="Model 1"),
288
- )
289
-
290
- heatmap = base.mark_rect().encode(
291
- color=alt.Color(
292
- f"{col}:Q",
293
- legend=None,
294
- scale=alt.Scale(
295
- scheme=HEATMAP_COLOR_SCHEME,
296
- domain=domain,
297
- domainMid=domain_mid,
298
- clamp=True,
299
- ),
300
- ),
301
- tooltip=tooltip,
302
- )
303
-
304
- text_main = base.mark_text(dy=-8, fontSize=8, baseline="top", yOffset=5).encode(
305
- text=alt.Text(f"{col}:Q", format=".1f"),
306
- color=alt.condition(
307
- text_condition,
308
- alt.value(COLORS["text_white"]),
309
- alt.value(COLORS["text_black"]),
310
- ),
311
- tooltip=tooltip,
312
- )
313
-
314
- return (
315
- (heatmap + text_main)
316
- .properties(
317
- height=550,
318
- title={
319
- "text": f"Pairwise {cbar_label} ({metric_name}) with 95% CIs",
320
- "fontSize": 16,
321
- },
322
- )
323
- .configure_axis(labelFontSize=11, titleFontSize=13, titleFontWeight="bold")
324
- .resolve_scale(color="independent")
325
- )
326
-
327
-
328
- def construct_pivot_table_from_df(errors: pd.DataFrame, metric_name: str) -> pd.io.formats.style.Styler:
329
- """Construct styled pivot table from precomputed DataFrame."""
330
-
331
- def highlight_by_position(styler):
332
- rank_colors = {1: COLORS["gold"], 2: COLORS["silver"], 3: COLORS["bronze"]}
333
-
334
- for row_idx in errors.index:
335
- row_ranks = errors.loc[row_idx].rank(method="min")
336
- for col_idx in errors.columns:
337
- rank = row_ranks[col_idx]
338
- style_parts = []
339
-
340
- # Rank background colors
341
- if rank <= 3:
342
- style_parts.append(f"background-color: {rank_colors[rank]}")
343
- else:
344
- style_parts.append(f"color: {COLORS['text_default']}")
345
-
346
- if style_parts:
347
- styler = styler.map(
348
- lambda x, s="; ".join(style_parts): s,
349
- subset=pd.IndexSlice[row_idx:row_idx, col_idx:col_idx],
350
- )
351
- return styler
352
-
353
- return highlight_by_position(errors.style).format(precision=3)
354
-
355
-
356
- def construct_pivot_table(
357
- summaries: pd.DataFrame,
358
- metric_name: str,
359
- baseline_model: str,
360
- leakage_imputation_model: str,
361
- ) -> pd.io.formats.style.Styler:
362
- errors = fev.pivot_table(summaries=summaries, metric_column=metric_name, task_columns=["task_name"])
363
- train_overlap = (
364
- fev.pivot_table(
365
- summaries=summaries,
366
- metric_column="trained_on_this_dataset",
367
- task_columns=["task_name"],
368
- )
369
- .fillna(False)
370
- .astype(bool)
371
- )
372
-
373
- is_imputed_baseline = errors.isna()
374
- is_leakage_imputed = train_overlap
375
-
376
- # Handle imputations
377
- errors = errors.mask(train_overlap, errors[leakage_imputation_model], axis=0)
378
- for col in errors.columns:
379
- if col != baseline_model:
380
- errors[col] = errors[col].fillna(errors[baseline_model])
381
-
382
- errors = errors[errors.rank(axis=1).mean().sort_values().index]
383
- errors.index.rename("Task name", inplace=True)
384
-
385
- def highlight_by_position(styler):
386
- rank_colors = {1: COLORS["gold"], 2: COLORS["silver"], 3: COLORS["bronze"]}
387
-
388
- for row_idx in errors.index:
389
- row_ranks = errors.loc[row_idx].rank(method="min")
390
- for col_idx in errors.columns:
391
- rank = row_ranks[col_idx]
392
- style_parts = []
393
-
394
- # Rank background colors
395
- if rank <= 3:
396
- style_parts.append(f"background-color: {rank_colors[rank]}")
397
-
398
- # Imputation text colors
399
- if is_leakage_imputed.loc[row_idx, col_idx]:
400
- style_parts.append(f"color: {COLORS['leakage_impute']}")
401
- elif is_imputed_baseline.loc[row_idx, col_idx]:
402
- style_parts.append(f"color: {COLORS['failure_impute']}")
403
- elif not style_parts or (len(style_parts) == 1 and "font-weight" in style_parts[0]):
404
- style_parts.append(f"color: {COLORS['text_default']}")
405
-
406
- if style_parts:
407
- styler = styler.map(
408
- lambda x, s="; ".join(style_parts): s,
409
- subset=pd.IndexSlice[row_idx:row_idx, col_idx:col_idx],
410
- )
411
- return styler
412
-
413
- return highlight_by_position(errors.style).format(precision=3)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_cloud/leaderboard_MASE.csv DELETED
@@ -1,29 +0,0 @@
1
- model_name,win_rate,skill_score,median_training_time_s_per100,median_inference_time_s_per100,training_corpus_overlap,num_failures
2
- Toto-2.0-2.5B,96.11111111111113,47.105140103596796,0.0,5.064579399732653,0.0,0.0
3
- Toto-2.0-1B,95.37037037037037,47.049179559947774,0.0,2.3743196950416188,0.0,0.0
4
- Toto-2.0-313m,92.4074074074074,46.485472580621256,0.0,0.9745701860666667,0.0,0.0
5
- Toto-2.0-22m,84.25925925925925,43.92623198246986,0.0,0.13920661274489796,0.0,0.0
6
- Toto-1.0,78.70370370370371,41.88927928450025,0.0,45.854219394249995,0.0,0.0
7
- Chronos-2,75.55555555555556,42.51579967639686,0.0,1.1862588189,0.0,0.0
8
- Toto-2.0-4m,73.51851851851853,40.931171483779714,0.0,0.09261558033545919,0.0,0.0
9
- TimesFM-2.5,69.44444444444444,40.26605676264323,0.0,6.434508300230608,0.0,0.0
10
- TiRex-2,67.96296296296298,39.65417127595432,0.0,0.19312244271691675,0.0,0.0
11
- TiRex,64.81481481481481,38.09940061802194,0.0,0.20884203875396826,0.0,0.0
12
- Moirai-2.0,52.03703703703704,35.5798994200739,0.0,0.35171731723214283,0.1,0.0
13
- FlowState,51.66666666666666,30.68598311802213,0.0,12.472611368300264,0.0,0.0
14
- TabPFN-TS-3,50.74074074074074,34.02528132692776,0.0,431.5150328579276,0.0,0.0
15
- PatchTST,48.51851851851852,34.304846616783294,1068.4652680383783,0.7892402496428571,0.0,0.0
16
- TFT,48.425925925925924,34.39379489295074,1003.5120332510221,1.1076982505700976,0.0,0.0
17
- Sundial-Base,48.14814814814816,34.444932595485724,0.0,7.874095355196429,0.0,0.0
18
- Chronos-Bolt,46.11111111111111,30.890375949929528,0.0,0.21284866287857143,0.0,0.0
19
- TabPFN-TS,44.25925925925926,31.182648441489537,0.0,285.2805137923404,0.0,0.0
20
- CatBoost,40.74074074074074,28.99041616417205,123.37088255733154,0.43462186795918367,0.0,0.0
21
- DeepAR,36.48148148148148,25.641579380120593,1590.4637105111146,1.558186748969388,0.0,0.0
22
- LightGBM,30.185185185185183,21.217567102831968,7.053590123430682,0.3469036807346939,0.0,0.0
23
- Stat. Ensemble,23.98148148148148,12.457381191619765,0.0,140.07917045413043,0.0,5.0
24
- AutoARIMA,21.38888888888889,13.156560456056853,0.0,18.324502920714288,0.0,5.0
25
- AutoETS,15.64814814814815,9.008132945543156,0.0,2.9907604154761906,0.0,15.0
26
- AutoTheta,15.555555555555555,6.832233363582574,0.0,4.0546638315458425,0.0,0.0
27
- Naive,12.77777777777778,-25.50199781747715,0.0,0.43933051720441596,0.0,0.0
28
- Seasonal Naive,10.37037037037037,0.0,0.0,0.5176203110585994,0.0,0.0
29
- Drift,4.814814814814815,-32.85429098273796,0.0,0.4190869192562794,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_cloud/leaderboard_SQL.csv DELETED
@@ -1,29 +0,0 @@
1
- model_name,win_rate,skill_score,median_training_time_s_per100,median_inference_time_s_per100,training_corpus_overlap,num_failures
2
- Toto-2.0-2.5B,97.03703703703704,66.67609437659667,0.0,5.064579399732653,0.0,0.0
3
- Toto-2.0-1B,95.55555555555557,66.67229326421315,0.0,2.3743196950416188,0.0,0.0
4
- Toto-2.0-313m,92.77777777777779,66.42835118245338,0.0,0.9745701860666667,0.0,0.0
5
- Toto-2.0-22m,85.74074074074073,64.64905946685398,0.0,0.13920661274489796,0.0,0.0
6
- Toto-1.0,78.70370370370368,63.05875031595707,0.0,45.854219394249995,0.0,0.0
7
- Chronos-2,76.4814814814815,63.92789670076326,0.0,1.1862588189,0.0,0.0
8
- Toto-2.0-4m,75.0,62.51740509789393,0.0,0.09261558033545919,0.0,0.0
9
- TiRex-2,70.74074074074075,61.657338261486025,0.0,0.19312244271691675,0.0,0.0
10
- TimesFM-2.5,69.81481481481482,61.98663035039822,0.0,6.434508300230608,0.0,0.0
11
- TiRex,66.48148148148148,60.871565834690514,0.0,0.20884203875396826,0.0,0.0
12
- TabPFN-TS-3,57.59259259259261,59.42246884042356,0.0,431.5150328579276,0.0,0.0
13
- Moirai-2.0,54.44444444444445,58.416109773202194,0.0,0.35171731723214283,0.1,0.0
14
- FlowState,53.51851851851852,55.917373913965896,0.0,12.472611368300264,0.0,0.0
15
- PatchTST,49.351851851851855,56.65838528437654,1068.4652680383783,0.7892402496428571,0.0,0.0
16
- TFT,48.51851851851852,56.101100728840805,1003.5120332510221,1.1076982505700976,0.0,0.0
17
- Sundial-Base,45.37037037037038,56.64773521043558,0.0,7.874095355196429,0.0,0.0
18
- Chronos-Bolt,45.370370370370374,54.85929046462743,0.0,0.21284866287857143,0.0,0.0
19
- TabPFN-TS,43.7037037037037,54.882167458139385,0.0,285.2805137923404,0.0,0.0
20
- DeepAR,38.7962962962963,50.20430422932948,1590.4637105111146,1.558186748969388,0.0,0.0
21
- CatBoost,31.85185185185186,46.25315473529981,123.37088255733154,0.43462186795918367,0.0,0.0
22
- LightGBM,25.740740740740737,40.369919076130486,7.053590123430682,0.3469036807346939,0.0,0.0
23
- AutoARIMA,25.092592592592595,34.1099179045811,0.0,18.324502920714288,0.0,5.0
24
- Stat. Ensemble,22.499999999999996,21.741616773476768,0.0,140.07917045413043,0.0,5.0
25
- AutoETS,16.01851851851852,-26.853793282334813,0.0,2.9907604154761906,0.0,15.0
26
- AutoTheta,11.851851851851853,-2.114517117703918,0.0,4.0546638315458425,0.0,0.0
27
- Seasonal Naive,11.759259259259258,0.0,0.0,0.5176203110585994,0.0,0.0
28
- Naive,7.962962962962965,-102.14853947002402,0.0,0.43933051720441596,0.0,0.0
29
- Drift,2.2222222222222228,-110.24318719846286,0.0,0.4190869192562794,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_cloud/leaderboard_WAPE.csv DELETED
@@ -1,29 +0,0 @@
1
- model_name,win_rate,skill_score,median_training_time_s_per100,median_inference_time_s_per100,training_corpus_overlap,num_failures
2
- Toto-2.0-2.5B,97.03703703703704,53.71035361627254,0.0,5.064579399732653,0.0,0.0
3
- Toto-2.0-1B,95.37037037037038,53.096830919470946,0.0,2.3743196950416188,0.0,0.0
4
- Toto-2.0-313m,93.14814814814815,52.69411150627982,0.0,0.9745701860666667,0.0,0.0
5
- Toto-2.0-22m,85.92592592592592,50.191472774349634,0.0,0.13920661274489796,0.0,0.0
6
- Chronos-2,78.14814814814817,50.57276323971893,0.0,1.1862588189,0.0,0.0
7
- Toto-1.0,77.5925925925926,47.09252281338565,0.0,45.854219394249995,0.0,0.0
8
- Toto-2.0-4m,72.96296296296298,47.10219495180865,0.0,0.09261558033545919,0.0,0.0
9
- TiRex-2,68.33333333333333,46.55373683052376,0.0,0.19312244271691675,0.0,0.0
10
- TimesFM-2.5,68.14814814814817,46.24771958720855,0.0,6.434508300230608,0.0,0.0
11
- TiRex,63.888888888888886,44.520635260445665,0.0,0.20884203875396826,0.0,0.0
12
- TabPFN-TS-3,56.85185185185186,46.210313482546184,0.0,431.5150328579276,0.0,0.0
13
- FlowState,56.11111111111112,44.39308253523333,0.0,12.472611368300264,0.0,0.0
14
- Moirai-2.0,53.51851851851852,42.79254856807111,0.0,0.35171731723214283,0.1,0.0
15
- TabPFN-TS,50.37037037037037,42.304181829008726,0.0,285.2805137923404,0.0,0.0
16
- PatchTST,49.07407407407408,42.75818805959519,1068.4652680383783,0.7892402496428571,0.0,0.0
17
- Sundial-Base,47.5925925925926,41.966358434053696,0.0,7.874095355196429,0.0,0.0
18
- Chronos-Bolt,47.22222222222222,39.89366883509092,0.0,0.21284866287857143,0.0,0.0
19
- TFT,45.46296296296297,37.9920627846737,1003.5120332510221,1.1076982505700976,0.0,0.0
20
- CatBoost,37.03703703703704,34.58752644878078,123.37088255733154,0.43462186795918367,0.0,0.0
21
- DeepAR,36.11111111111111,31.125782577257844,1590.4637105111146,1.558186748969388,0.0,0.0
22
- LightGBM,29.074074074074076,27.03716130150796,7.053590123430682,0.3469036807346939,0.0,0.0
23
- Stat. Ensemble,21.38888888888889,17.59542897915567,0.0,140.07917045413043,0.0,5.0
24
- AutoARIMA,18.425925925925924,16.5309827995087,0.0,18.324502920714288,0.0,5.0
25
- AutoETS,14.351851851851851,5.6618608202705705,0.0,2.9907604154761906,0.0,15.0
26
- AutoTheta,12.77777777777778,12.660865320459136,0.0,4.0546638315458425,0.0,0.0
27
- Naive,12.222222222222221,4.49837321934039,0.0,0.43933051720441596,0.0,0.0
28
- Seasonal Naive,7.4074074074074066,0.0,0.0,0.5176203110585994,0.0,0.0
29
- Drift,4.4444444444444455,-1.7537853153904326,0.0,0.4190869192562794,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_cloud/leaderboard_WQL.csv DELETED
@@ -1,29 +0,0 @@
1
- model_name,win_rate,skill_score,median_training_time_s_per100,median_inference_time_s_per100,training_corpus_overlap,num_failures
2
- Toto-2.0-2.5B,97.96296296296296,69.03469555605878,0.0,5.064579399732653,0.0,0.0
3
- Toto-2.0-1B,95.74074074074075,68.75529346896873,0.0,2.3743196950416188,0.0,0.0
4
- Toto-2.0-313m,92.5925925925926,68.41066967488192,0.0,0.9745701860666667,0.0,0.0
5
- Toto-2.0-22m,86.11111111111111,66.78327813931047,0.0,0.13920661274489796,0.0,0.0
6
- Chronos-2,78.70370370370372,66.94397676250325,0.0,1.1862588189,0.0,0.0
7
- Toto-1.0,76.2962962962963,64.46135334372015,0.0,45.854219394249995,0.0,0.0
8
- Toto-2.0-4m,73.88888888888887,64.42603072886158,0.0,0.09261558033545919,0.0,0.0
9
- TiRex-2,70.37037037037037,63.99709672683953,0.0,0.19312244271691675,0.0,0.0
10
- TimesFM-2.5,67.77777777777779,63.7537487246866,0.0,6.434508300230608,0.0,0.0
11
- TiRex,66.29629629629629,62.74382048246822,0.0,0.20884203875396826,0.0,0.0
12
- TabPFN-TS-3,61.66666666666669,64.3601359782909,0.0,431.5150328579276,0.0,0.0
13
- FlowState,58.518518518518526,62.649468493586056,0.0,12.472611368300264,0.0,0.0
14
- Moirai-2.0,55.37037037037037,61.08750954950368,0.0,0.35171731723214283,0.1,0.0
15
- PatchTST,50.64814814814817,59.71037333425973,1068.4652680383783,0.7892402496428571,0.0,0.0
16
- TFT,47.77777777777778,55.556509382143545,1003.5120332510221,1.1076982505700976,0.0,0.0
17
- TabPFN-TS,46.2962962962963,58.432181218600874,0.0,285.2805137923404,0.0,0.0
18
- Chronos-Bolt,45.18518518518518,58.15816295699815,0.0,0.21284866287857143,0.0,0.0
19
- Sundial-Base,43.88888888888889,59.21372871831863,0.0,7.874095355196429,0.0,0.0
20
- DeepAR,38.425925925925924,50.79429174981283,1590.4637105111146,1.558186748969388,0.0,0.0
21
- CatBoost,31.48148148148148,46.843426009989976,123.37088255733154,0.43462186795918367,0.0,0.0
22
- LightGBM,26.481481481481485,40.70772252024998,7.053590123430682,0.3469036807346939,0.0,0.0
23
- AutoARIMA,23.240740740740744,34.821696297938075,0.0,18.324502920714288,0.0,5.0
24
- Stat. Ensemble,20.09259259259259,22.34504540092107,0.0,140.07917045413043,0.0,5.0
25
- AutoETS,13.425925925925927,-39.995047645386684,0.0,2.9907604154761906,0.0,15.0
26
- AutoTheta,11.48148148148148,7.361982676335321,0.0,4.0546638315458425,0.0,0.0
27
- Seasonal Naive,10.648148148148149,0.0,0.0,0.5176203110585994,0.0,0.0
28
- Naive,7.222222222222223,-64.9788901369484,0.0,0.43933051720441596,0.0,0.0
29
- Drift,2.407407407407407,-71.7471743825873,0.0,0.4190869192562794,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_cloud/pairwise_MASE.csv DELETED
@@ -1,290 +0,0 @@
1
- model_1,model_2,win_rate,win_rate_lower,win_rate_upper,skill_score,skill_score_lower,skill_score_upper
2
- Toto-2.0-2.5B,Toto-2.0-2.5B,0.5,0.5,0.5,0.0,0.0,0.0
3
- Toto-2.0-2.5B,Toto-2.0-1B,0.6,0.4,0.8,0.001,-0.011,0.012
4
- Toto-2.0-2.5B,Toto-2.0-313m,0.8,0.6,0.95,0.012,0.002,0.024
5
- Toto-2.0-2.5B,Toto-2.0-22m,1.0,1.0,1.0,0.057,0.031,0.088
6
- Toto-2.0-2.5B,Toto-1.0,0.95,0.85,1.0,0.09,0.05,0.136
7
- Toto-2.0-2.5B,Chronos-2,0.95,0.85,1.0,0.08,0.048,0.124
8
- Toto-2.0-2.5B,Toto-2.0-4m,1.0,1.0,1.0,0.105,0.061,0.155
9
- Toto-2.0-2.5B,TiRex-2,0.95,0.85,1.0,0.123,0.077,0.173
10
- Toto-2.0-2.5B,TimesFM-2.5,0.95,0.85,1.0,0.114,0.07,0.181
11
- Toto-2.0-2.5B,TiRex,1.0,1.0,1.0,0.145,0.082,0.223
12
- Toto-2.0-2.5B,FlowState,0.9,0.75,1.0,0.237,0.125,0.356
13
- Toto-2.0-2.5B,Moirai-2.0,1.0,1.0,1.0,0.179,0.114,0.268
14
- Toto-2.0-2.5B,TabPFN-TS-3,0.95,0.85,1.0,0.198,0.107,0.308
15
- Toto-2.0-2.5B,TFT,1.0,1.0,1.0,0.194,0.136,0.259
16
- Toto-2.0-2.5B,PatchTST,0.95,0.85,1.0,0.195,0.12,0.276
17
- Toto-2.0-2.5B,Chronos-Bolt,1.0,1.0,1.0,0.235,0.163,0.308
18
- Toto-2.0-2.5B,Seasonal Naive,1.0,1.0,1.0,0.471,0.37,0.587
19
- Toto-2.0-1B,Toto-2.0-2.5B,0.4,0.2,0.6,-0.001,-0.012,0.011
20
- Toto-2.0-1B,Toto-2.0-1B,0.5,0.5,0.5,0.0,0.0,0.0
21
- Toto-2.0-1B,Toto-2.0-313m,0.8,0.6,0.95,0.011,0.001,0.022
22
- Toto-2.0-1B,Toto-2.0-22m,1.0,1.0,1.0,0.056,0.028,0.092
23
- Toto-2.0-1B,Toto-1.0,1.0,1.0,1.0,0.089,0.051,0.132
24
- Toto-2.0-1B,Chronos-2,0.95,0.85,1.0,0.079,0.042,0.127
25
- Toto-2.0-1B,Toto-2.0-4m,1.0,1.0,1.0,0.104,0.06,0.157
26
- Toto-2.0-1B,TiRex-2,0.95,0.85,1.0,0.123,0.077,0.175
27
- Toto-2.0-1B,TimesFM-2.5,0.9,0.75,1.0,0.114,0.068,0.183
28
- Toto-2.0-1B,TiRex,1.0,1.0,1.0,0.145,0.084,0.223
29
- Toto-2.0-1B,FlowState,0.9,0.75,1.0,0.236,0.115,0.36
30
- Toto-2.0-1B,Moirai-2.0,1.0,1.0,1.0,0.178,0.112,0.271
31
- Toto-2.0-1B,TabPFN-TS-3,0.95,0.85,1.0,0.197,0.101,0.318
32
- Toto-2.0-1B,TFT,1.0,1.0,1.0,0.193,0.137,0.254
33
- Toto-2.0-1B,PatchTST,0.95,0.85,1.0,0.194,0.117,0.277
34
- Toto-2.0-1B,Chronos-Bolt,1.0,1.0,1.0,0.234,0.16,0.311
35
- Toto-2.0-1B,Seasonal Naive,1.0,1.0,1.0,0.47,0.372,0.586
36
- Toto-2.0-313m,Toto-2.0-2.5B,0.2,0.05,0.4,-0.012,-0.024,-0.002
37
- Toto-2.0-313m,Toto-2.0-1B,0.2,0.05,0.4,-0.011,-0.023,-0.001
38
- Toto-2.0-313m,Toto-2.0-313m,0.5,0.5,0.5,0.0,0.0,0.0
39
- Toto-2.0-313m,Toto-2.0-22m,1.0,1.0,1.0,0.046,0.025,0.076
40
- Toto-2.0-313m,Toto-1.0,0.95,0.85,1.0,0.079,0.045,0.121
41
- Toto-2.0-313m,Chronos-2,0.95,0.85,1.0,0.069,0.033,0.115
42
- Toto-2.0-313m,Toto-2.0-4m,1.0,1.0,1.0,0.094,0.056,0.144
43
- Toto-2.0-313m,TiRex-2,0.95,0.85,1.0,0.113,0.073,0.158
44
- Toto-2.0-313m,TimesFM-2.5,0.95,0.85,1.0,0.104,0.058,0.173
45
- Toto-2.0-313m,TiRex,1.0,1.0,1.0,0.135,0.076,0.212
46
- Toto-2.0-313m,FlowState,0.9,0.75,1.0,0.228,0.113,0.349
47
- Toto-2.0-313m,Moirai-2.0,1.0,1.0,1.0,0.169,0.107,0.26
48
- Toto-2.0-313m,TabPFN-TS-3,0.95,0.85,1.0,0.189,0.093,0.302
49
- Toto-2.0-313m,TFT,1.0,1.0,1.0,0.184,0.131,0.249
50
- Toto-2.0-313m,PatchTST,0.95,0.85,1.0,0.185,0.105,0.268
51
- Toto-2.0-313m,Chronos-Bolt,1.0,1.0,1.0,0.226,0.157,0.3
52
- Toto-2.0-313m,Seasonal Naive,1.0,1.0,1.0,0.465,0.364,0.583
53
- Toto-2.0-22m,Toto-2.0-2.5B,0.0,0.0,0.0,-0.06,-0.096,-0.032
54
- Toto-2.0-22m,Toto-2.0-1B,0.0,0.0,0.0,-0.059,-0.102,-0.029
55
- Toto-2.0-22m,Toto-2.0-313m,0.0,0.0,0.0,-0.048,-0.082,-0.026
56
- Toto-2.0-22m,Toto-2.0-22m,0.5,0.5,0.5,0.0,0.0,0.0
57
- Toto-2.0-22m,Toto-1.0,0.75,0.55,0.9,0.035,0.012,0.064
58
- Toto-2.0-22m,Chronos-2,0.85,0.7,1.0,0.025,-0.013,0.052
59
- Toto-2.0-22m,Toto-2.0-4m,1.0,1.0,1.0,0.051,0.03,0.076
60
- Toto-2.0-22m,TiRex-2,0.9,0.75,1.0,0.071,0.046,0.096
61
- Toto-2.0-22m,TimesFM-2.5,0.85,0.699,1.0,0.061,0.016,0.111
62
- Toto-2.0-22m,TiRex,0.85,0.7,1.0,0.094,0.047,0.149
63
- Toto-2.0-22m,FlowState,0.9,0.75,1.0,0.191,0.077,0.306
64
- Toto-2.0-22m,Moirai-2.0,1.0,1.0,1.0,0.13,0.081,0.2
65
- Toto-2.0-22m,TabPFN-TS-3,0.95,0.85,1.0,0.15,0.058,0.249
66
- Toto-2.0-22m,TFT,1.0,1.0,1.0,0.145,0.093,0.21
67
- Toto-2.0-22m,PatchTST,0.9,0.75,1.0,0.146,0.069,0.221
68
- Toto-2.0-22m,Chronos-Bolt,1.0,1.0,1.0,0.189,0.128,0.252
69
- Toto-2.0-22m,Seasonal Naive,1.0,1.0,1.0,0.439,0.34,0.551
70
- Toto-1.0,Toto-2.0-2.5B,0.05,0.0,0.15,-0.099,-0.157,-0.052
71
- Toto-1.0,Toto-2.0-1B,0.0,0.0,0.0,-0.097,-0.152,-0.053
72
- Toto-1.0,Toto-2.0-313m,0.05,0.0,0.15,-0.086,-0.138,-0.047
73
- Toto-1.0,Toto-2.0-22m,0.25,0.1,0.45,-0.036,-0.068,-0.012
74
- Toto-1.0,Toto-1.0,0.5,0.5,0.5,0.0,0.0,0.0
75
- Toto-1.0,Chronos-2,0.65,0.45,0.85,-0.011,-0.063,0.027
76
- Toto-1.0,Toto-2.0-4m,0.7,0.45,0.9,0.016,-0.007,0.04
77
- Toto-1.0,TiRex-2,0.85,0.7,1.0,0.037,0.014,0.059
78
- Toto-1.0,TimesFM-2.5,0.7,0.5,0.9,0.027,-0.02,0.072
79
- Toto-1.0,TiRex,0.8,0.6,0.95,0.061,0.027,0.114
80
- Toto-1.0,FlowState,0.85,0.7,1.0,0.162,0.041,0.286
81
- Toto-1.0,Moirai-2.0,0.95,0.85,1.0,0.098,0.052,0.164
82
- Toto-1.0,TabPFN-TS-3,0.95,0.85,1.0,0.119,0.024,0.226
83
- Toto-1.0,TFT,0.9,0.75,1.0,0.114,0.071,0.159
84
- Toto-1.0,PatchTST,0.9,0.75,1.0,0.115,0.034,0.185
85
- Toto-1.0,Chronos-Bolt,0.9,0.75,1.0,0.159,0.094,0.224
86
- Toto-1.0,Seasonal Naive,1.0,1.0,1.0,0.419,0.323,0.528
87
- Chronos-2,Toto-2.0-2.5B,0.05,0.0,0.15,-0.087,-0.141,-0.05
88
- Chronos-2,Toto-2.0-1B,0.05,0.0,0.15,-0.086,-0.145,-0.044
89
- Chronos-2,Toto-2.0-313m,0.05,0.0,0.15,-0.074,-0.13,-0.034
90
- Chronos-2,Toto-2.0-22m,0.15,0.0,0.3,-0.025,-0.055,0.013
91
- Chronos-2,Toto-1.0,0.35,0.15,0.55,0.011,-0.028,0.059
92
- Chronos-2,Chronos-2,0.5,0.5,0.5,0.0,0.0,0.0
93
- Chronos-2,Toto-2.0-4m,0.6,0.35,0.8,0.027,-0.006,0.067
94
- Chronos-2,TiRex-2,0.7,0.5,0.9,0.047,0.011,0.093
95
- Chronos-2,TimesFM-2.5,0.7,0.5,0.9,0.038,0.009,0.071
96
- Chronos-2,TiRex,0.75,0.55,0.95,0.071,0.022,0.128
97
- Chronos-2,FlowState,0.8,0.6,0.95,0.171,0.067,0.29
98
- Chronos-2,Moirai-2.0,1.0,1.0,1.0,0.108,0.053,0.168
99
- Chronos-2,TabPFN-TS-3,0.8,0.6,0.95,0.129,0.052,0.222
100
- Chronos-2,TFT,0.85,0.699,1.0,0.124,0.065,0.193
101
- Chronos-2,PatchTST,0.9,0.75,1.0,0.125,0.065,0.189
102
- Chronos-2,Chronos-Bolt,0.95,0.85,1.0,0.168,0.101,0.231
103
- Chronos-2,Seasonal Naive,1.0,1.0,1.0,0.425,0.331,0.534
104
- Toto-2.0-4m,Toto-2.0-2.5B,0.0,0.0,0.0,-0.117,-0.184,-0.065
105
- Toto-2.0-4m,Toto-2.0-1B,0.0,0.0,0.0,-0.116,-0.187,-0.064
106
- Toto-2.0-4m,Toto-2.0-313m,0.0,0.0,0.0,-0.104,-0.168,-0.059
107
- Toto-2.0-4m,Toto-2.0-22m,0.0,0.0,0.0,-0.053,-0.083,-0.031
108
- Toto-2.0-4m,Toto-1.0,0.3,0.1,0.55,-0.016,-0.042,0.007
109
- Toto-2.0-4m,Chronos-2,0.4,0.2,0.65,-0.028,-0.072,0.006
110
- Toto-2.0-4m,Toto-2.0-4m,0.5,0.5,0.5,0.0,0.0,0.0
111
- Toto-2.0-4m,TiRex-2,0.85,0.65,1.0,0.021,0.008,0.034
112
- Toto-2.0-4m,TimesFM-2.5,0.65,0.4,0.85,0.011,-0.032,0.048
113
- Toto-2.0-4m,TiRex,0.75,0.55,0.9,0.046,0.017,0.083
114
- Toto-2.0-4m,FlowState,0.85,0.699,1.0,0.148,0.032,0.269
115
- Toto-2.0-4m,Moirai-2.0,1.0,1.0,1.0,0.083,0.05,0.134
116
- Toto-2.0-4m,TabPFN-TS-3,0.9,0.75,1.0,0.105,0.014,0.197
117
- Toto-2.0-4m,TFT,0.9,0.75,1.0,0.1,0.046,0.16
118
- Toto-2.0-4m,PatchTST,0.85,0.699,1.0,0.101,0.019,0.165
119
- Toto-2.0-4m,Chronos-Bolt,1.0,1.0,1.0,0.145,0.092,0.201
120
- Toto-2.0-4m,Seasonal Naive,0.95,0.85,1.0,0.409,0.315,0.516
121
- TiRex-2,Toto-2.0-2.5B,0.05,0.0,0.15,-0.141,-0.209,-0.084
122
- TiRex-2,Toto-2.0-1B,0.05,0.0,0.15,-0.14,-0.212,-0.083
123
- TiRex-2,Toto-2.0-313m,0.05,0.0,0.15,-0.128,-0.188,-0.078
124
- TiRex-2,Toto-2.0-22m,0.1,0.0,0.25,-0.076,-0.106,-0.049
125
- TiRex-2,Toto-1.0,0.15,0.0,0.3,-0.038,-0.063,-0.014
126
- TiRex-2,Chronos-2,0.3,0.1,0.5,-0.05,-0.103,-0.011
127
- TiRex-2,Toto-2.0-4m,0.15,0.0,0.35,-0.022,-0.035,-0.008
128
- TiRex-2,TiRex-2,0.5,0.5,0.5,0.0,0.0,0.0
129
- TiRex-2,TimesFM-2.5,0.6,0.4,0.8,-0.01,-0.061,0.036
130
- TiRex-2,TiRex,0.65,0.45,0.85,0.025,-0.006,0.072
131
- TiRex-2,FlowState,0.8,0.6,0.95,0.129,0.009,0.25
132
- TiRex-2,Moirai-2.0,0.85,0.7,1.0,0.063,0.027,0.121
133
- TiRex-2,TabPFN-TS-3,0.85,0.7,1.0,0.085,-0.01,0.184
134
- TiRex-2,TFT,0.8,0.6,0.95,0.08,0.03,0.141
135
- TiRex-2,PatchTST,0.9,0.75,1.0,0.081,-0.011,0.149
136
- TiRex-2,Chronos-Bolt,0.95,0.85,1.0,0.127,0.072,0.184
137
- TiRex-2,Seasonal Naive,0.95,0.85,1.0,0.397,0.293,0.51
138
- TimesFM-2.5,Toto-2.0-2.5B,0.05,0.0,0.15,-0.129,-0.22,-0.075
139
- TimesFM-2.5,Toto-2.0-1B,0.1,0.0,0.25,-0.128,-0.224,-0.073
140
- TimesFM-2.5,Toto-2.0-313m,0.05,0.0,0.15,-0.116,-0.209,-0.061
141
- TimesFM-2.5,Toto-2.0-22m,0.15,0.0,0.301,-0.065,-0.125,-0.016
142
- TimesFM-2.5,Toto-1.0,0.3,0.1,0.5,-0.028,-0.078,0.02
143
- TimesFM-2.5,Chronos-2,0.3,0.1,0.5,-0.039,-0.077,-0.009
144
- TimesFM-2.5,Toto-2.0-4m,0.35,0.15,0.6,-0.011,-0.05,0.031
145
- TimesFM-2.5,TiRex-2,0.4,0.2,0.6,0.01,-0.037,0.058
146
- TimesFM-2.5,TimesFM-2.5,0.5,0.5,0.5,0.0,0.0,0.0
147
- TimesFM-2.5,TiRex,0.65,0.45,0.85,0.035,-0.0,0.077
148
- TimesFM-2.5,FlowState,0.7,0.5,0.9,0.138,0.03,0.267
149
- TimesFM-2.5,Moirai-2.0,0.9,0.75,1.0,0.073,0.035,0.115
150
- TimesFM-2.5,TabPFN-TS-3,0.75,0.55,0.95,0.095,0.024,0.186
151
- TimesFM-2.5,TFT,0.8,0.6,0.95,0.09,0.017,0.163
152
- TimesFM-2.5,PatchTST,0.8,0.649,0.95,0.091,0.037,0.142
153
- TimesFM-2.5,Chronos-Bolt,0.85,0.65,1.0,0.136,0.068,0.199
154
- TimesFM-2.5,Seasonal Naive,1.0,1.0,1.0,0.403,0.318,0.501
155
- TiRex,Toto-2.0-2.5B,0.0,0.0,0.0,-0.17,-0.287,-0.09
156
- TiRex,Toto-2.0-1B,0.0,0.0,0.0,-0.169,-0.287,-0.092
157
- TiRex,Toto-2.0-313m,0.0,0.0,0.0,-0.157,-0.27,-0.083
158
- TiRex,Toto-2.0-22m,0.15,0.0,0.3,-0.104,-0.176,-0.05
159
- TiRex,Toto-1.0,0.2,0.05,0.4,-0.065,-0.129,-0.028
160
- TiRex,Chronos-2,0.25,0.05,0.45,-0.077,-0.146,-0.022
161
- TiRex,Toto-2.0-4m,0.25,0.1,0.45,-0.048,-0.091,-0.017
162
- TiRex,TiRex-2,0.35,0.15,0.55,-0.026,-0.077,0.006
163
- TiRex,TimesFM-2.5,0.35,0.15,0.55,-0.036,-0.083,0.0
164
- TiRex,TiRex,0.5,0.5,0.5,0.0,0.0,0.0
165
- TiRex,FlowState,0.65,0.45,0.85,0.107,-0.02,0.236
166
- TiRex,Moirai-2.0,0.8,0.6,0.95,0.039,0.014,0.065
167
- TiRex,TabPFN-TS-3,0.85,0.7,1.0,0.062,-0.03,0.149
168
- TiRex,TFT,0.8,0.6,0.95,0.056,-0.02,0.121
169
- TiRex,PatchTST,0.85,0.7,1.0,0.058,-0.029,0.118
170
- TiRex,Chronos-Bolt,0.75,0.55,0.9,0.104,0.038,0.166
171
- TiRex,Seasonal Naive,1.0,1.0,1.0,0.381,0.295,0.476
172
- FlowState,Toto-2.0-2.5B,0.1,0.0,0.25,-0.31,-0.554,-0.142
173
- FlowState,Toto-2.0-1B,0.1,0.0,0.25,-0.309,-0.563,-0.131
174
- FlowState,Toto-2.0-313m,0.1,0.0,0.25,-0.295,-0.536,-0.128
175
- FlowState,Toto-2.0-22m,0.1,0.0,0.25,-0.236,-0.442,-0.084
176
- FlowState,Toto-1.0,0.15,0.0,0.3,-0.193,-0.401,-0.043
177
- FlowState,Chronos-2,0.2,0.05,0.4,-0.206,-0.408,-0.072
178
- FlowState,Toto-2.0-4m,0.15,0.0,0.301,-0.173,-0.368,-0.033
179
- FlowState,TiRex-2,0.2,0.05,0.4,-0.149,-0.333,-0.009
180
- FlowState,TimesFM-2.5,0.3,0.1,0.5,-0.16,-0.363,-0.031
181
- FlowState,TiRex,0.35,0.15,0.55,-0.12,-0.308,0.02
182
- FlowState,FlowState,0.5,0.5,0.5,0.0,0.0,0.0
183
- FlowState,Moirai-2.0,0.4,0.2,0.6,-0.076,-0.251,0.058
184
- FlowState,TabPFN-TS-3,0.5,0.3,0.7,-0.051,-0.155,0.045
185
- FlowState,TFT,0.55,0.3,0.75,-0.057,-0.249,0.076
186
- FlowState,PatchTST,0.5,0.3,0.7,-0.055,-0.227,0.056
187
- FlowState,Chronos-Bolt,0.5,0.3,0.7,-0.003,-0.136,0.112
188
- FlowState,Seasonal Naive,0.9,0.75,1.0,0.307,0.147,0.442
189
- Moirai-2.0,Toto-2.0-2.5B,0.0,0.0,0.0,-0.218,-0.367,-0.129
190
- Moirai-2.0,Toto-2.0-1B,0.0,0.0,0.0,-0.217,-0.371,-0.126
191
- Moirai-2.0,Toto-2.0-313m,0.0,0.0,0.0,-0.204,-0.352,-0.12
192
- Moirai-2.0,Toto-2.0-22m,0.0,0.0,0.0,-0.149,-0.25,-0.088
193
- Moirai-2.0,Toto-1.0,0.05,0.0,0.15,-0.109,-0.196,-0.055
194
- Moirai-2.0,Chronos-2,0.0,0.0,0.0,-0.121,-0.202,-0.056
195
- Moirai-2.0,Toto-2.0-4m,0.0,0.0,0.0,-0.091,-0.155,-0.052
196
- Moirai-2.0,TiRex-2,0.15,0.0,0.3,-0.068,-0.137,-0.027
197
- Moirai-2.0,TimesFM-2.5,0.1,0.0,0.25,-0.078,-0.13,-0.036
198
- Moirai-2.0,TiRex,0.2,0.05,0.4,-0.041,-0.07,-0.015
199
- Moirai-2.0,FlowState,0.6,0.4,0.8,0.071,-0.062,0.201
200
- Moirai-2.0,Moirai-2.0,0.5,0.5,0.5,0.0,0.0,0.0
201
- Moirai-2.0,TabPFN-TS-3,0.65,0.45,0.85,0.024,-0.061,0.104
202
- Moirai-2.0,TFT,0.5,0.3,0.7,0.018,-0.08,0.104
203
- Moirai-2.0,PatchTST,0.6,0.4,0.8,0.019,-0.064,0.081
204
- Moirai-2.0,Chronos-Bolt,0.65,0.425,0.825,0.068,-0.002,0.135
205
- Moirai-2.0,Seasonal Naive,0.95,0.85,1.0,0.356,0.268,0.451
206
- TabPFN-TS-3,Toto-2.0-2.5B,0.05,0.0,0.15,-0.247,-0.446,-0.12
207
- TabPFN-TS-3,Toto-2.0-1B,0.05,0.0,0.15,-0.246,-0.466,-0.113
208
- TabPFN-TS-3,Toto-2.0-313m,0.05,0.0,0.15,-0.233,-0.432,-0.103
209
- TabPFN-TS-3,Toto-2.0-22m,0.05,0.0,0.15,-0.177,-0.331,-0.061
210
- TabPFN-TS-3,Toto-1.0,0.05,0.0,0.15,-0.135,-0.291,-0.025
211
- TabPFN-TS-3,Chronos-2,0.2,0.05,0.4,-0.148,-0.286,-0.055
212
- TabPFN-TS-3,Toto-2.0-4m,0.1,0.0,0.25,-0.117,-0.245,-0.014
213
- TabPFN-TS-3,TiRex-2,0.15,0.0,0.3,-0.093,-0.225,0.01
214
- TabPFN-TS-3,TimesFM-2.5,0.25,0.05,0.45,-0.104,-0.229,-0.025
215
- TabPFN-TS-3,TiRex,0.15,0.0,0.3,-0.066,-0.176,0.03
216
- TabPFN-TS-3,FlowState,0.5,0.3,0.7,0.048,-0.047,0.134
217
- TabPFN-TS-3,Moirai-2.0,0.35,0.15,0.55,-0.024,-0.116,0.057
218
- TabPFN-TS-3,TabPFN-TS-3,0.5,0.5,0.5,0.0,0.0,0.0
219
- TabPFN-TS-3,TFT,0.6,0.4,0.8,-0.006,-0.164,0.102
220
- TabPFN-TS-3,PatchTST,0.45,0.25,0.65,-0.004,-0.118,0.077
221
- TabPFN-TS-3,Chronos-Bolt,0.45,0.25,0.65,0.045,-0.057,0.144
222
- TabPFN-TS-3,Seasonal Naive,0.95,0.85,1.0,0.34,0.224,0.444
223
- TFT,Toto-2.0-2.5B,0.0,0.0,0.0,-0.24,-0.35,-0.157
224
- TFT,Toto-2.0-1B,0.0,0.0,0.0,-0.239,-0.34,-0.159
225
- TFT,Toto-2.0-313m,0.0,0.0,0.0,-0.226,-0.331,-0.15
226
- TFT,Toto-2.0-22m,0.0,0.0,0.0,-0.17,-0.266,-0.102
227
- TFT,Toto-1.0,0.1,0.0,0.25,-0.129,-0.188,-0.076
228
- TFT,Chronos-2,0.15,0.0,0.301,-0.141,-0.239,-0.069
229
- TFT,Toto-2.0-4m,0.1,0.0,0.25,-0.111,-0.191,-0.048
230
- TFT,TiRex-2,0.2,0.05,0.4,-0.087,-0.164,-0.03
231
- TFT,TimesFM-2.5,0.2,0.05,0.4,-0.098,-0.194,-0.017
232
- TFT,TiRex,0.2,0.05,0.4,-0.06,-0.138,0.02
233
- TFT,FlowState,0.45,0.25,0.7,0.053,-0.082,0.2
234
- TFT,Moirai-2.0,0.5,0.3,0.7,-0.018,-0.117,0.074
235
- TFT,TabPFN-TS-3,0.4,0.2,0.6,0.006,-0.113,0.141
236
- TFT,TFT,0.5,0.5,0.5,0.0,0.0,0.0
237
- TFT,PatchTST,0.575,0.375,0.8,0.001,-0.11,0.092
238
- TFT,Chronos-Bolt,0.55,0.35,0.75,0.051,-0.051,0.135
239
- TFT,Seasonal Naive,0.925,0.824,1.0,0.344,0.234,0.473
240
- PatchTST,Toto-2.0-2.5B,0.05,0.0,0.15,-0.242,-0.381,-0.137
241
- PatchTST,Toto-2.0-1B,0.05,0.0,0.15,-0.241,-0.383,-0.132
242
- PatchTST,Toto-2.0-313m,0.05,0.0,0.15,-0.228,-0.366,-0.118
243
- PatchTST,Toto-2.0-22m,0.1,0.0,0.25,-0.172,-0.283,-0.074
244
- PatchTST,Toto-1.0,0.1,0.0,0.25,-0.131,-0.227,-0.035
245
- PatchTST,Chronos-2,0.1,0.0,0.25,-0.143,-0.234,-0.07
246
- PatchTST,Toto-2.0-4m,0.15,0.0,0.301,-0.112,-0.197,-0.02
247
- PatchTST,TiRex-2,0.1,0.0,0.25,-0.089,-0.174,0.01
248
- PatchTST,TimesFM-2.5,0.2,0.05,0.351,-0.1,-0.166,-0.038
249
- PatchTST,TiRex,0.15,0.0,0.3,-0.061,-0.134,0.028
250
- PatchTST,FlowState,0.5,0.3,0.7,0.052,-0.059,0.185
251
- PatchTST,Moirai-2.0,0.4,0.2,0.6,-0.02,-0.089,0.06
252
- PatchTST,TabPFN-TS-3,0.55,0.35,0.75,0.004,-0.084,0.105
253
- PatchTST,TFT,0.425,0.2,0.625,-0.001,-0.101,0.099
254
- PatchTST,PatchTST,0.5,0.5,0.5,0.0,0.0,0.0
255
- PatchTST,Chronos-Bolt,0.45,0.2,0.65,0.049,-0.039,0.137
256
- PatchTST,Seasonal Naive,0.9,0.775,1.0,0.343,0.237,0.456
257
- Chronos-Bolt,Toto-2.0-2.5B,0.0,0.0,0.0,-0.307,-0.445,-0.194
258
- Chronos-Bolt,Toto-2.0-1B,0.0,0.0,0.0,-0.305,-0.452,-0.191
259
- Chronos-Bolt,Toto-2.0-313m,0.0,0.0,0.0,-0.291,-0.429,-0.186
260
- Chronos-Bolt,Toto-2.0-22m,0.0,0.0,0.0,-0.232,-0.336,-0.147
261
- Chronos-Bolt,Toto-1.0,0.1,0.0,0.25,-0.189,-0.288,-0.104
262
- Chronos-Bolt,Chronos-2,0.05,0.0,0.15,-0.202,-0.3,-0.112
263
- Chronos-Bolt,Toto-2.0-4m,0.0,0.0,0.0,-0.17,-0.252,-0.101
264
- Chronos-Bolt,TiRex-2,0.05,0.0,0.15,-0.145,-0.225,-0.077
265
- Chronos-Bolt,TimesFM-2.5,0.15,0.0,0.35,-0.157,-0.248,-0.073
266
- Chronos-Bolt,TiRex,0.25,0.1,0.45,-0.116,-0.198,-0.039
267
- Chronos-Bolt,FlowState,0.5,0.3,0.7,0.003,-0.127,0.12
268
- Chronos-Bolt,Moirai-2.0,0.35,0.175,0.575,-0.073,-0.156,0.002
269
- Chronos-Bolt,TabPFN-TS-3,0.55,0.35,0.75,-0.048,-0.169,0.054
270
- Chronos-Bolt,TFT,0.45,0.25,0.65,-0.053,-0.156,0.049
271
- Chronos-Bolt,PatchTST,0.55,0.35,0.8,-0.052,-0.159,0.037
272
- Chronos-Bolt,Chronos-Bolt,0.5,0.5,0.5,0.0,0.0,0.0
273
- Chronos-Bolt,Seasonal Naive,0.85,0.7,1.0,0.309,0.185,0.434
274
- Seasonal Naive,Toto-2.0-2.5B,0.0,0.0,0.0,-0.891,-1.422,-0.588
275
- Seasonal Naive,Toto-2.0-1B,0.0,0.0,0.0,-0.889,-1.413,-0.593
276
- Seasonal Naive,Toto-2.0-313m,0.0,0.0,0.0,-0.869,-1.396,-0.571
277
- Seasonal Naive,Toto-2.0-22m,0.0,0.0,0.0,-0.783,-1.229,-0.515
278
- Seasonal Naive,Toto-1.0,0.0,0.0,0.0,-0.721,-1.121,-0.477
279
- Seasonal Naive,Chronos-2,0.0,0.0,0.0,-0.74,-1.148,-0.496
280
- Seasonal Naive,Toto-2.0-4m,0.05,0.0,0.15,-0.693,-1.065,-0.459
281
- Seasonal Naive,TiRex-2,0.05,0.0,0.15,-0.657,-1.043,-0.414
282
- Seasonal Naive,TimesFM-2.5,0.0,0.0,0.0,-0.674,-1.003,-0.466
283
- Seasonal Naive,TiRex,0.0,0.0,0.0,-0.615,-0.909,-0.418
284
- Seasonal Naive,FlowState,0.1,0.0,0.25,-0.443,-0.793,-0.172
285
- Seasonal Naive,Moirai-2.0,0.05,0.0,0.15,-0.552,-0.822,-0.365
286
- Seasonal Naive,TabPFN-TS-3,0.05,0.0,0.15,-0.516,-0.797,-0.289
287
- Seasonal Naive,TFT,0.075,0.0,0.176,-0.524,-0.897,-0.305
288
- Seasonal Naive,PatchTST,0.1,0.0,0.225,-0.522,-0.838,-0.31
289
- Seasonal Naive,Chronos-Bolt,0.15,0.0,0.3,-0.447,-0.766,-0.228
290
- Seasonal Naive,Seasonal Naive,0.5,0.5,0.5,0.0,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_cloud/pairwise_SQL.csv DELETED
@@ -1,290 +0,0 @@
1
- model_1,model_2,win_rate,win_rate_lower,win_rate_upper,skill_score,skill_score_lower,skill_score_upper
2
- Toto-2.0-2.5B,Toto-2.0-2.5B,0.5,0.5,0.5,0.0,0.0,0.0
3
- Toto-2.0-2.5B,Toto-2.0-1B,0.7,0.5,0.851,0.0,-0.014,0.012
4
- Toto-2.0-2.5B,Toto-2.0-313m,0.8,0.6,0.95,0.007,-0.005,0.02
5
- Toto-2.0-2.5B,Toto-2.0-22m,1.0,1.0,1.0,0.057,0.035,0.084
6
- Toto-2.0-2.5B,Toto-1.0,1.0,1.0,1.0,0.098,0.06,0.139
7
- Toto-2.0-2.5B,Chronos-2,0.95,0.85,1.0,0.076,0.052,0.104
8
- Toto-2.0-2.5B,Toto-2.0-4m,1.0,1.0,1.0,0.111,0.069,0.154
9
- Toto-2.0-2.5B,TiRex-2,1.0,1.0,1.0,0.131,0.084,0.178
10
- Toto-2.0-2.5B,TimesFM-2.5,1.0,1.0,1.0,0.123,0.081,0.177
11
- Toto-2.0-2.5B,TiRex,1.0,1.0,1.0,0.148,0.088,0.214
12
- Toto-2.0-2.5B,TabPFN-TS-3,0.95,0.85,1.0,0.179,0.107,0.265
13
- Toto-2.0-2.5B,FlowState,0.9,0.75,1.0,0.244,0.135,0.358
14
- Toto-2.0-2.5B,Moirai-2.0,1.0,1.0,1.0,0.199,0.13,0.271
15
- Toto-2.0-2.5B,TFT,1.0,1.0,1.0,0.241,0.165,0.317
16
- Toto-2.0-2.5B,PatchTST,0.95,0.85,1.0,0.231,0.156,0.306
17
- Toto-2.0-2.5B,Chronos-Bolt,1.0,1.0,1.0,0.262,0.194,0.323
18
- Toto-2.0-2.5B,Seasonal Naive,1.0,1.0,1.0,0.667,0.566,0.758
19
- Toto-2.0-1B,Toto-2.0-2.5B,0.3,0.149,0.5,-0.0,-0.012,0.014
20
- Toto-2.0-1B,Toto-2.0-1B,0.5,0.5,0.5,0.0,0.0,0.0
21
- Toto-2.0-1B,Toto-2.0-313m,0.8,0.6,0.95,0.007,-0.001,0.018
22
- Toto-2.0-1B,Toto-2.0-22m,1.0,1.0,1.0,0.057,0.031,0.089
23
- Toto-2.0-1B,Toto-1.0,1.0,1.0,1.0,0.098,0.058,0.137
24
- Toto-2.0-1B,Chronos-2,0.95,0.85,1.0,0.076,0.045,0.113
25
- Toto-2.0-1B,Toto-2.0-4m,1.0,1.0,1.0,0.111,0.067,0.159
26
- Toto-2.0-1B,TiRex-2,0.95,0.85,1.0,0.131,0.083,0.181
27
- Toto-2.0-1B,TimesFM-2.5,1.0,1.0,1.0,0.123,0.079,0.184
28
- Toto-2.0-1B,TiRex,1.0,1.0,1.0,0.148,0.088,0.217
29
- Toto-2.0-1B,TabPFN-TS-3,0.95,0.85,1.0,0.179,0.102,0.272
30
- Toto-2.0-1B,FlowState,0.95,0.85,1.0,0.244,0.129,0.364
31
- Toto-2.0-1B,Moirai-2.0,1.0,1.0,1.0,0.199,0.129,0.277
32
- Toto-2.0-1B,TFT,1.0,1.0,1.0,0.241,0.163,0.314
33
- Toto-2.0-1B,PatchTST,0.95,0.85,1.0,0.231,0.149,0.311
34
- Toto-2.0-1B,Chronos-Bolt,1.0,1.0,1.0,0.262,0.192,0.328
35
- Toto-2.0-1B,Seasonal Naive,1.0,1.0,1.0,0.667,0.566,0.759
36
- Toto-2.0-313m,Toto-2.0-2.5B,0.2,0.05,0.4,-0.007,-0.021,0.005
37
- Toto-2.0-313m,Toto-2.0-1B,0.2,0.05,0.4,-0.007,-0.018,0.001
38
- Toto-2.0-313m,Toto-2.0-313m,0.5,0.5,0.5,0.0,0.0,0.0
39
- Toto-2.0-313m,Toto-2.0-22m,1.0,1.0,1.0,0.05,0.03,0.076
40
- Toto-2.0-313m,Toto-1.0,1.0,1.0,1.0,0.091,0.055,0.129
41
- Toto-2.0-313m,Chronos-2,0.95,0.85,1.0,0.069,0.038,0.106
42
- Toto-2.0-313m,Toto-2.0-4m,1.0,1.0,1.0,0.104,0.064,0.149
43
- Toto-2.0-313m,TiRex-2,0.95,0.85,1.0,0.124,0.08,0.171
44
- Toto-2.0-313m,TimesFM-2.5,0.95,0.85,1.0,0.117,0.072,0.179
45
- Toto-2.0-313m,TiRex,1.0,1.0,1.0,0.142,0.084,0.212
46
- Toto-2.0-313m,TabPFN-TS-3,0.95,0.85,1.0,0.173,0.093,0.266
47
- Toto-2.0-313m,FlowState,0.95,0.85,1.0,0.238,0.125,0.356
48
- Toto-2.0-313m,Moirai-2.0,1.0,1.0,1.0,0.193,0.124,0.271
49
- Toto-2.0-313m,TFT,1.0,1.0,1.0,0.235,0.16,0.307
50
- Toto-2.0-313m,PatchTST,0.95,0.85,1.0,0.225,0.146,0.305
51
- Toto-2.0-313m,Chronos-Bolt,1.0,1.0,1.0,0.256,0.19,0.318
52
- Toto-2.0-313m,Seasonal Naive,1.0,1.0,1.0,0.664,0.561,0.758
53
- Toto-2.0-22m,Toto-2.0-2.5B,0.0,0.0,0.0,-0.061,-0.091,-0.036
54
- Toto-2.0-22m,Toto-2.0-1B,0.0,0.0,0.0,-0.061,-0.098,-0.032
55
- Toto-2.0-22m,Toto-2.0-313m,0.0,0.0,0.0,-0.053,-0.082,-0.031
56
- Toto-2.0-22m,Toto-2.0-22m,0.5,0.5,0.5,0.0,0.0,0.0
57
- Toto-2.0-22m,Toto-1.0,0.85,0.7,1.0,0.043,0.02,0.071
58
- Toto-2.0-22m,Chronos-2,0.85,0.7,1.0,0.02,-0.019,0.047
59
- Toto-2.0-22m,Toto-2.0-4m,1.0,1.0,1.0,0.057,0.034,0.082
60
- Toto-2.0-22m,TiRex-2,0.95,0.85,1.0,0.078,0.049,0.106
61
- Toto-2.0-22m,TimesFM-2.5,0.85,0.699,1.0,0.07,0.023,0.119
62
- Toto-2.0-22m,TiRex,0.95,0.85,1.0,0.097,0.053,0.149
63
- Toto-2.0-22m,TabPFN-TS-3,0.95,0.85,1.0,0.129,0.048,0.211
64
- Toto-2.0-22m,FlowState,0.9,0.75,1.0,0.198,0.085,0.312
65
- Toto-2.0-22m,Moirai-2.0,1.0,1.0,1.0,0.15,0.094,0.211
66
- Toto-2.0-22m,TFT,1.0,1.0,1.0,0.195,0.126,0.267
67
- Toto-2.0-22m,PatchTST,0.95,0.85,1.0,0.184,0.101,0.256
68
- Toto-2.0-22m,Chronos-Bolt,1.0,1.0,1.0,0.217,0.158,0.27
69
- Toto-2.0-22m,Seasonal Naive,1.0,1.0,1.0,0.646,0.539,0.743
70
- Toto-1.0,Toto-2.0-2.5B,0.0,0.0,0.0,-0.109,-0.162,-0.064
71
- Toto-1.0,Toto-2.0-1B,0.0,0.0,0.0,-0.108,-0.159,-0.062
72
- Toto-1.0,Toto-2.0-313m,0.0,0.0,0.0,-0.1,-0.148,-0.058
73
- Toto-1.0,Toto-2.0-22m,0.15,0.0,0.3,-0.045,-0.076,-0.02
74
- Toto-1.0,Toto-1.0,0.5,0.5,0.5,0.0,0.0,0.0
75
- Toto-1.0,Chronos-2,0.6,0.4,0.8,-0.024,-0.08,0.018
76
- Toto-1.0,Toto-2.0-4m,0.7,0.5,0.9,0.014,-0.008,0.036
77
- Toto-1.0,TiRex-2,0.85,0.7,1.0,0.037,0.012,0.06
78
- Toto-1.0,TimesFM-2.5,0.75,0.55,0.95,0.028,-0.025,0.076
79
- Toto-1.0,TiRex,0.8,0.6,0.95,0.056,0.022,0.104
80
- Toto-1.0,TabPFN-TS-3,0.95,0.85,1.0,0.09,0.005,0.175
81
- Toto-1.0,FlowState,0.85,0.7,1.0,0.162,0.04,0.284
82
- Toto-1.0,Moirai-2.0,0.95,0.85,1.0,0.112,0.064,0.169
83
- Toto-1.0,TFT,0.95,0.85,1.0,0.158,0.096,0.217
84
- Toto-1.0,PatchTST,0.9,0.75,1.0,0.148,0.055,0.221
85
- Toto-1.0,Chronos-Bolt,0.95,0.85,1.0,0.182,0.124,0.236
86
- Toto-1.0,Seasonal Naive,1.0,1.0,1.0,0.631,0.52,0.73
87
- Chronos-2,Toto-2.0-2.5B,0.05,0.0,0.15,-0.082,-0.116,-0.055
88
- Chronos-2,Toto-2.0-1B,0.05,0.0,0.15,-0.082,-0.127,-0.047
89
- Chronos-2,Toto-2.0-313m,0.05,0.0,0.15,-0.074,-0.119,-0.039
90
- Chronos-2,Toto-2.0-22m,0.15,0.0,0.3,-0.02,-0.049,0.019
91
- Chronos-2,Toto-1.0,0.4,0.2,0.6,0.024,-0.018,0.074
92
- Chronos-2,Chronos-2,0.5,0.5,0.5,0.0,0.0,0.0
93
- Chronos-2,Toto-2.0-4m,0.6,0.35,0.8,0.038,0.001,0.085
94
- Chronos-2,TiRex-2,0.65,0.4,0.85,0.059,0.017,0.111
95
- Chronos-2,TimesFM-2.5,0.75,0.55,0.9,0.051,0.017,0.09
96
- Chronos-2,TiRex,0.75,0.55,0.9,0.078,0.024,0.139
97
- Chronos-2,TabPFN-TS-3,0.85,0.7,1.0,0.111,0.053,0.183
98
- Chronos-2,FlowState,0.85,0.65,1.0,0.182,0.078,0.296
99
- Chronos-2,Moirai-2.0,1.0,1.0,1.0,0.133,0.069,0.2
100
- Chronos-2,TFT,0.9,0.75,1.0,0.178,0.097,0.258
101
- Chronos-2,PatchTST,0.85,0.7,1.0,0.168,0.103,0.231
102
- Chronos-2,Chronos-Bolt,1.0,1.0,1.0,0.201,0.134,0.261
103
- Chronos-2,Seasonal Naive,1.0,1.0,1.0,0.639,0.533,0.735
104
- Toto-2.0-4m,Toto-2.0-2.5B,0.0,0.0,0.0,-0.125,-0.182,-0.074
105
- Toto-2.0-4m,Toto-2.0-1B,0.0,0.0,0.0,-0.125,-0.189,-0.072
106
- Toto-2.0-4m,Toto-2.0-313m,0.0,0.0,0.0,-0.116,-0.175,-0.069
107
- Toto-2.0-4m,Toto-2.0-22m,0.0,0.0,0.0,-0.06,-0.089,-0.035
108
- Toto-2.0-4m,Toto-1.0,0.3,0.1,0.5,-0.015,-0.037,0.008
109
- Toto-2.0-4m,Chronos-2,0.4,0.2,0.65,-0.039,-0.093,-0.001
110
- Toto-2.0-4m,Toto-2.0-4m,0.5,0.5,0.5,0.0,0.0,0.0
111
- Toto-2.0-4m,TiRex-2,0.8,0.6,0.95,0.022,0.009,0.035
112
- Toto-2.0-4m,TimesFM-2.5,0.65,0.4,0.85,0.014,-0.039,0.056
113
- Toto-2.0-4m,TiRex,0.75,0.55,0.9,0.042,0.015,0.077
114
- Toto-2.0-4m,TabPFN-TS-3,0.85,0.7,1.0,0.076,-0.009,0.147
115
- Toto-2.0-4m,FlowState,0.9,0.75,1.0,0.15,0.028,0.27
116
- Toto-2.0-4m,Moirai-2.0,1.0,1.0,1.0,0.099,0.061,0.145
117
- Toto-2.0-4m,TFT,0.9,0.75,1.0,0.146,0.077,0.211
118
- Toto-2.0-4m,PatchTST,0.9,0.75,1.0,0.135,0.047,0.204
119
- Toto-2.0-4m,Chronos-Bolt,1.0,1.0,1.0,0.17,0.12,0.218
120
- Toto-2.0-4m,Seasonal Naive,1.0,1.0,1.0,0.625,0.515,0.726
121
- TiRex-2,Toto-2.0-2.5B,0.0,0.0,0.0,-0.151,-0.216,-0.092
122
- TiRex-2,Toto-2.0-1B,0.05,0.0,0.15,-0.15,-0.22,-0.09
123
- TiRex-2,Toto-2.0-313m,0.05,0.0,0.15,-0.142,-0.206,-0.087
124
- TiRex-2,Toto-2.0-22m,0.05,0.0,0.15,-0.085,-0.119,-0.051
125
- TiRex-2,Toto-1.0,0.15,0.0,0.3,-0.038,-0.064,-0.012
126
- TiRex-2,Chronos-2,0.35,0.15,0.6,-0.063,-0.125,-0.017
127
- TiRex-2,Toto-2.0-4m,0.2,0.05,0.4,-0.023,-0.037,-0.009
128
- TiRex-2,TiRex-2,0.5,0.5,0.5,0.0,0.0,0.0
129
- TiRex-2,TimesFM-2.5,0.55,0.349,0.75,-0.009,-0.07,0.04
130
- TiRex-2,TiRex,0.65,0.45,0.85,0.02,-0.01,0.064
131
- TiRex-2,TabPFN-TS-3,0.85,0.7,1.0,0.055,-0.036,0.135
132
- TiRex-2,FlowState,0.85,0.699,1.0,0.13,0.007,0.247
133
- TiRex-2,Moirai-2.0,0.9,0.75,1.0,0.078,0.043,0.128
134
- TiRex-2,TFT,0.85,0.7,0.95,0.127,0.064,0.19
135
- TiRex-2,PatchTST,0.95,0.85,1.0,0.115,0.021,0.184
136
- TiRex-2,Chronos-Bolt,0.95,0.85,1.0,0.151,0.106,0.197
137
- TiRex-2,Seasonal Naive,1.0,1.0,1.0,0.617,0.505,0.72
138
- TimesFM-2.5,Toto-2.0-2.5B,0.0,0.0,0.0,-0.141,-0.216,-0.088
139
- TimesFM-2.5,Toto-2.0-1B,0.0,0.0,0.0,-0.141,-0.226,-0.086
140
- TimesFM-2.5,Toto-2.0-313m,0.05,0.0,0.15,-0.132,-0.218,-0.078
141
- TimesFM-2.5,Toto-2.0-22m,0.15,0.0,0.301,-0.075,-0.136,-0.024
142
- TimesFM-2.5,Toto-1.0,0.25,0.05,0.45,-0.029,-0.082,0.024
143
- TimesFM-2.5,Chronos-2,0.25,0.1,0.45,-0.054,-0.099,-0.017
144
- TimesFM-2.5,Toto-2.0-4m,0.35,0.15,0.6,-0.014,-0.059,0.038
145
- TimesFM-2.5,TiRex-2,0.45,0.25,0.651,0.009,-0.041,0.065
146
- TimesFM-2.5,TimesFM-2.5,0.5,0.5,0.5,0.0,0.0,0.0
147
- TimesFM-2.5,TiRex,0.6,0.4,0.8,0.028,-0.014,0.08
148
- TimesFM-2.5,TabPFN-TS-3,0.75,0.55,0.95,0.063,0.005,0.129
149
- TimesFM-2.5,FlowState,0.85,0.7,1.0,0.138,0.034,0.263
150
- TimesFM-2.5,Moirai-2.0,0.9,0.75,1.0,0.086,0.038,0.143
151
- TimesFM-2.5,TFT,0.8,0.6,0.95,0.134,0.04,0.217
152
- TimesFM-2.5,PatchTST,0.8,0.649,0.95,0.123,0.058,0.187
153
- TimesFM-2.5,Chronos-Bolt,0.9,0.75,1.0,0.158,0.095,0.217
154
- TimesFM-2.5,Seasonal Naive,1.0,1.0,1.0,0.62,0.519,0.713
155
- TiRex,Toto-2.0-2.5B,0.0,0.0,0.0,-0.174,-0.273,-0.097
156
- TiRex,Toto-2.0-1B,0.0,0.0,0.0,-0.174,-0.277,-0.096
157
- TiRex,Toto-2.0-313m,0.0,0.0,0.0,-0.166,-0.27,-0.091
158
- TiRex,Toto-2.0-22m,0.05,0.0,0.15,-0.107,-0.176,-0.056
159
- TiRex,Toto-1.0,0.2,0.05,0.4,-0.059,-0.116,-0.023
160
- TiRex,Chronos-2,0.25,0.1,0.45,-0.085,-0.162,-0.025
161
- TiRex,Toto-2.0-4m,0.25,0.1,0.45,-0.044,-0.083,-0.015
162
- TiRex,TiRex-2,0.35,0.15,0.55,-0.02,-0.068,0.01
163
- TiRex,TimesFM-2.5,0.4,0.2,0.6,-0.029,-0.086,0.013
164
- TiRex,TiRex,0.5,0.5,0.5,0.0,0.0,0.0
165
- TiRex,TabPFN-TS-3,0.8,0.6,0.95,0.036,-0.056,0.102
166
- TiRex,FlowState,0.7,0.5,0.9,0.112,-0.021,0.241
167
- TiRex,Moirai-2.0,0.85,0.7,1.0,0.059,0.03,0.09
168
- TiRex,TFT,0.8,0.6,0.95,0.109,0.017,0.181
169
- TiRex,PatchTST,0.8,0.6,0.95,0.097,-0.003,0.171
170
- TiRex,Chronos-Bolt,0.9,0.75,1.0,0.133,0.073,0.186
171
- TiRex,Seasonal Naive,1.0,1.0,1.0,0.609,0.499,0.709
172
- TabPFN-TS-3,Toto-2.0-2.5B,0.05,0.0,0.15,-0.218,-0.361,-0.12
173
- TabPFN-TS-3,Toto-2.0-1B,0.05,0.0,0.15,-0.218,-0.374,-0.114
174
- TabPFN-TS-3,Toto-2.0-313m,0.05,0.0,0.15,-0.209,-0.363,-0.103
175
- TabPFN-TS-3,Toto-2.0-22m,0.05,0.0,0.15,-0.148,-0.267,-0.05
176
- TabPFN-TS-3,Toto-1.0,0.05,0.0,0.15,-0.098,-0.212,-0.005
177
- TabPFN-TS-3,Chronos-2,0.15,0.0,0.3,-0.125,-0.223,-0.057
178
- TabPFN-TS-3,Toto-2.0-4m,0.15,0.0,0.3,-0.083,-0.172,0.009
179
- TabPFN-TS-3,TiRex-2,0.15,0.0,0.3,-0.058,-0.156,0.035
180
- TabPFN-TS-3,TimesFM-2.5,0.25,0.05,0.45,-0.067,-0.148,-0.006
181
- TabPFN-TS-3,TiRex,0.2,0.05,0.4,-0.037,-0.113,0.053
182
- TabPFN-TS-3,TabPFN-TS-3,0.5,0.5,0.5,0.0,0.0,0.0
183
- TabPFN-TS-3,FlowState,0.5,0.3,0.7,0.08,-0.032,0.187
184
- TabPFN-TS-3,Moirai-2.0,0.45,0.25,0.65,0.024,-0.037,0.104
185
- TabPFN-TS-3,TFT,0.7,0.5,0.9,0.076,-0.051,0.174
186
- TabPFN-TS-3,PatchTST,0.7,0.5,0.9,0.064,-0.012,0.126
187
- TabPFN-TS-3,Chronos-Bolt,0.65,0.4,0.85,0.101,0.008,0.193
188
- TabPFN-TS-3,Seasonal Naive,1.0,1.0,1.0,0.594,0.486,0.694
189
- FlowState,Toto-2.0-2.5B,0.1,0.0,0.25,-0.323,-0.558,-0.156
190
- FlowState,Toto-2.0-1B,0.05,0.0,0.15,-0.323,-0.571,-0.148
191
- FlowState,Toto-2.0-313m,0.05,0.0,0.15,-0.313,-0.553,-0.142
192
- FlowState,Toto-2.0-22m,0.1,0.0,0.25,-0.247,-0.453,-0.093
193
- FlowState,Toto-1.0,0.15,0.0,0.3,-0.193,-0.397,-0.041
194
- FlowState,Chronos-2,0.15,0.0,0.35,-0.222,-0.421,-0.084
195
- FlowState,Toto-2.0-4m,0.1,0.0,0.25,-0.176,-0.37,-0.029
196
- FlowState,TiRex-2,0.15,0.0,0.301,-0.15,-0.328,-0.007
197
- FlowState,TimesFM-2.5,0.15,0.0,0.3,-0.16,-0.356,-0.035
198
- FlowState,TiRex,0.3,0.1,0.5,-0.127,-0.318,0.02
199
- FlowState,TabPFN-TS-3,0.5,0.3,0.7,-0.086,-0.23,0.031
200
- FlowState,FlowState,0.5,0.5,0.5,0.0,0.0,0.0
201
- FlowState,Moirai-2.0,0.4,0.2,0.6,-0.06,-0.225,0.076
202
- FlowState,TFT,0.55,0.3,0.75,-0.004,-0.165,0.115
203
- FlowState,PatchTST,0.5,0.3,0.7,-0.017,-0.152,0.083
204
- FlowState,Chronos-Bolt,0.55,0.35,0.75,0.023,-0.108,0.139
205
- FlowState,Seasonal Naive,0.95,0.85,1.0,0.559,0.424,0.672
206
- Moirai-2.0,Toto-2.0-2.5B,0.0,0.0,0.0,-0.248,-0.371,-0.15
207
- Moirai-2.0,Toto-2.0-1B,0.0,0.0,0.0,-0.248,-0.383,-0.148
208
- Moirai-2.0,Toto-2.0-313m,0.0,0.0,0.0,-0.239,-0.371,-0.142
209
- Moirai-2.0,Toto-2.0-22m,0.0,0.0,0.0,-0.176,-0.267,-0.104
210
- Moirai-2.0,Toto-1.0,0.05,0.0,0.15,-0.126,-0.203,-0.068
211
- Moirai-2.0,Chronos-2,0.0,0.0,0.0,-0.153,-0.249,-0.074
212
- Moirai-2.0,Toto-2.0-4m,0.0,0.0,0.0,-0.109,-0.169,-0.065
213
- Moirai-2.0,TiRex-2,0.1,0.0,0.25,-0.085,-0.146,-0.045
214
- Moirai-2.0,TimesFM-2.5,0.1,0.0,0.25,-0.094,-0.167,-0.039
215
- Moirai-2.0,TiRex,0.15,0.0,0.3,-0.063,-0.099,-0.03
216
- Moirai-2.0,TabPFN-TS-3,0.55,0.35,0.75,-0.025,-0.116,0.035
217
- Moirai-2.0,FlowState,0.6,0.4,0.8,0.057,-0.083,0.184
218
- Moirai-2.0,Moirai-2.0,0.5,0.5,0.5,0.0,0.0,0.0
219
- Moirai-2.0,TFT,0.65,0.4,0.85,0.053,-0.052,0.142
220
- Moirai-2.0,PatchTST,0.65,0.45,0.85,0.041,-0.065,0.115
221
- Moirai-2.0,Chronos-Bolt,0.8,0.6,0.95,0.079,0.017,0.14
222
- Moirai-2.0,Seasonal Naive,1.0,1.0,1.0,0.584,0.469,0.689
223
- TFT,Toto-2.0-2.5B,0.0,0.0,0.0,-0.317,-0.464,-0.198
224
- TFT,Toto-2.0-1B,0.0,0.0,0.0,-0.317,-0.457,-0.195
225
- TFT,Toto-2.0-313m,0.0,0.0,0.0,-0.308,-0.444,-0.191
226
- TFT,Toto-2.0-22m,0.0,0.0,0.0,-0.242,-0.363,-0.144
227
- TFT,Toto-1.0,0.05,0.0,0.15,-0.188,-0.277,-0.106
228
- TFT,Chronos-2,0.1,0.0,0.25,-0.217,-0.348,-0.107
229
- TFT,Toto-2.0-4m,0.1,0.0,0.25,-0.171,-0.267,-0.084
230
- TFT,TiRex-2,0.15,0.05,0.3,-0.145,-0.235,-0.068
231
- TFT,TimesFM-2.5,0.2,0.05,0.4,-0.155,-0.277,-0.042
232
- TFT,TiRex,0.2,0.05,0.4,-0.122,-0.221,-0.018
233
- TFT,TabPFN-TS-3,0.3,0.1,0.5,-0.082,-0.21,0.049
234
- TFT,FlowState,0.45,0.25,0.7,0.004,-0.13,0.142
235
- TFT,Moirai-2.0,0.35,0.15,0.6,-0.056,-0.166,0.049
236
- TFT,TFT,0.5,0.5,0.5,0.0,0.0,0.0
237
- TFT,PatchTST,0.575,0.375,0.8,-0.013,-0.135,0.076
238
- TFT,Chronos-Bolt,0.6,0.4,0.8,0.028,-0.073,0.104
239
- TFT,Seasonal Naive,0.9,0.75,1.0,0.561,0.416,0.683
240
- PatchTST,Toto-2.0-2.5B,0.05,0.0,0.15,-0.301,-0.442,-0.186
241
- PatchTST,Toto-2.0-1B,0.05,0.0,0.15,-0.3,-0.452,-0.175
242
- PatchTST,Toto-2.0-313m,0.05,0.0,0.15,-0.291,-0.438,-0.17
243
- PatchTST,Toto-2.0-22m,0.05,0.0,0.15,-0.226,-0.344,-0.113
244
- PatchTST,Toto-1.0,0.1,0.0,0.25,-0.173,-0.284,-0.058
245
- PatchTST,Chronos-2,0.15,0.0,0.3,-0.202,-0.3,-0.115
246
- PatchTST,Toto-2.0-4m,0.1,0.0,0.25,-0.156,-0.256,-0.049
247
- PatchTST,TiRex-2,0.05,0.0,0.15,-0.13,-0.226,-0.022
248
- PatchTST,TimesFM-2.5,0.2,0.05,0.351,-0.14,-0.23,-0.061
249
- PatchTST,TiRex,0.2,0.05,0.4,-0.108,-0.207,0.003
250
- PatchTST,TabPFN-TS-3,0.3,0.1,0.5,-0.068,-0.144,0.012
251
- PatchTST,FlowState,0.5,0.3,0.7,0.017,-0.09,0.132
252
- PatchTST,Moirai-2.0,0.35,0.15,0.55,-0.042,-0.129,0.061
253
- PatchTST,TFT,0.425,0.2,0.625,0.013,-0.082,0.119
254
- PatchTST,PatchTST,0.5,0.5,0.5,0.0,0.0,0.0
255
- PatchTST,Chronos-Bolt,0.4,0.2,0.6,0.04,-0.034,0.126
256
- PatchTST,Seasonal Naive,0.9,0.75,1.0,0.567,0.435,0.68
257
- Chronos-Bolt,Toto-2.0-2.5B,0.0,0.0,0.0,-0.355,-0.477,-0.24
258
- Chronos-Bolt,Toto-2.0-1B,0.0,0.0,0.0,-0.354,-0.487,-0.237
259
- Chronos-Bolt,Toto-2.0-313m,0.0,0.0,0.0,-0.345,-0.466,-0.235
260
- Chronos-Bolt,Toto-2.0-22m,0.0,0.0,0.0,-0.277,-0.37,-0.188
261
- Chronos-Bolt,Toto-1.0,0.05,0.0,0.15,-0.222,-0.31,-0.141
262
- Chronos-Bolt,Chronos-2,0.0,0.0,0.0,-0.251,-0.352,-0.155
263
- Chronos-Bolt,Toto-2.0-4m,0.0,0.0,0.0,-0.204,-0.279,-0.137
264
- Chronos-Bolt,TiRex-2,0.05,0.0,0.15,-0.177,-0.246,-0.119
265
- Chronos-Bolt,TimesFM-2.5,0.1,0.0,0.25,-0.187,-0.277,-0.105
266
- Chronos-Bolt,TiRex,0.1,0.0,0.25,-0.154,-0.229,-0.079
267
- Chronos-Bolt,TabPFN-TS-3,0.35,0.15,0.6,-0.112,-0.239,-0.008
268
- Chronos-Bolt,FlowState,0.45,0.25,0.65,-0.024,-0.161,0.097
269
- Chronos-Bolt,Moirai-2.0,0.2,0.05,0.4,-0.086,-0.162,-0.017
270
- Chronos-Bolt,TFT,0.4,0.2,0.6,-0.028,-0.116,0.068
271
- Chronos-Bolt,PatchTST,0.6,0.4,0.8,-0.042,-0.144,0.033
272
- Chronos-Bolt,Chronos-Bolt,0.5,0.5,0.5,0.0,0.0,0.0
273
- Chronos-Bolt,Seasonal Naive,0.9,0.75,1.0,0.549,0.413,0.67
274
- Seasonal Naive,Toto-2.0-2.5B,0.0,0.0,0.0,-2.001,-3.137,-1.304
275
- Seasonal Naive,Toto-2.0-1B,0.0,0.0,0.0,-2.001,-3.152,-1.302
276
- Seasonal Naive,Toto-2.0-313m,0.0,0.0,0.0,-1.979,-3.139,-1.28
277
- Seasonal Naive,Toto-2.0-22m,0.0,0.0,0.0,-1.829,-2.894,-1.168
278
- Seasonal Naive,Toto-1.0,0.0,0.0,0.0,-1.707,-2.709,-1.085
279
- Seasonal Naive,Chronos-2,0.0,0.0,0.0,-1.772,-2.77,-1.139
280
- Seasonal Naive,Toto-2.0-4m,0.0,0.0,0.0,-1.668,-2.646,-1.063
281
- Seasonal Naive,TiRex-2,0.0,0.0,0.0,-1.608,-2.568,-1.019
282
- Seasonal Naive,TimesFM-2.5,0.0,0.0,0.0,-1.631,-2.486,-1.077
283
- Seasonal Naive,TiRex,0.0,0.0,0.0,-1.556,-2.437,-0.997
284
- Seasonal Naive,TabPFN-TS-3,0.0,0.0,0.0,-1.464,-2.271,-0.947
285
- Seasonal Naive,FlowState,0.05,0.0,0.15,-1.268,-2.052,-0.736
286
- Seasonal Naive,Moirai-2.0,0.0,0.0,0.0,-1.405,-2.214,-0.883
287
- Seasonal Naive,TFT,0.1,0.0,0.25,-1.278,-2.153,-0.713
288
- Seasonal Naive,PatchTST,0.1,0.0,0.25,-1.307,-2.121,-0.769
289
- Seasonal Naive,Chronos-Bolt,0.1,0.0,0.25,-1.215,-2.027,-0.704
290
- Seasonal Naive,Seasonal Naive,0.5,0.5,0.5,0.0,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_cloud/pairwise_WAPE.csv DELETED
@@ -1,290 +0,0 @@
1
- model_1,model_2,win_rate,win_rate_lower,win_rate_upper,skill_score,skill_score_lower,skill_score_upper
2
- Toto-2.0-2.5B,Toto-2.0-2.5B,0.5,0.5,0.5,0.0,0.0,0.0
3
- Toto-2.0-2.5B,Toto-2.0-1B,0.65,0.4,0.85,0.013,-0.0,0.033
4
- Toto-2.0-2.5B,Toto-2.0-313m,0.85,0.65,1.0,0.021,0.003,0.051
5
- Toto-2.0-2.5B,Toto-2.0-22m,1.0,1.0,1.0,0.071,0.029,0.124
6
- Toto-2.0-2.5B,Chronos-2,0.9,0.75,1.0,0.063,0.023,0.11
7
- Toto-2.0-2.5B,Toto-1.0,1.0,1.0,1.0,0.125,0.053,0.213
8
- Toto-2.0-2.5B,Toto-2.0-4m,1.0,1.0,1.0,0.125,0.066,0.193
9
- Toto-2.0-2.5B,TiRex-2,1.0,1.0,1.0,0.134,0.073,0.209
10
- Toto-2.0-2.5B,TimesFM-2.5,0.95,0.85,1.0,0.139,0.086,0.203
11
- Toto-2.0-2.5B,TiRex,1.0,1.0,1.0,0.166,0.087,0.257
12
- Toto-2.0-2.5B,FlowState,0.95,0.85,1.0,0.168,0.079,0.256
13
- Toto-2.0-2.5B,TabPFN-TS-3,0.95,0.85,1.0,0.139,0.049,0.245
14
- Toto-2.0-2.5B,TabPFN-TS,1.0,1.0,1.0,0.198,0.141,0.267
15
- Toto-2.0-2.5B,Moirai-2.0,1.0,1.0,1.0,0.191,0.114,0.276
16
- Toto-2.0-2.5B,PatchTST,0.95,0.85,1.0,0.191,0.095,0.279
17
- Toto-2.0-2.5B,Chronos-Bolt,1.0,1.0,1.0,0.23,0.156,0.302
18
- Toto-2.0-2.5B,Seasonal Naive,1.0,1.0,1.0,0.537,0.421,0.654
19
- Toto-2.0-1B,Toto-2.0-2.5B,0.35,0.15,0.6,-0.013,-0.034,0.0
20
- Toto-2.0-1B,Toto-2.0-1B,0.5,0.5,0.5,0.0,0.0,0.0
21
- Toto-2.0-1B,Toto-2.0-313m,0.7,0.5,0.9,0.009,-0.002,0.023
22
- Toto-2.0-1B,Toto-2.0-22m,1.0,1.0,1.0,0.058,0.025,0.099
23
- Toto-2.0-1B,Chronos-2,0.9,0.75,1.0,0.051,-0.006,0.103
24
- Toto-2.0-1B,Toto-1.0,1.0,1.0,1.0,0.113,0.051,0.188
25
- Toto-2.0-1B,Toto-2.0-4m,1.0,1.0,1.0,0.113,0.062,0.171
26
- Toto-2.0-1B,TiRex-2,1.0,1.0,1.0,0.122,0.069,0.184
27
- Toto-2.0-1B,TimesFM-2.5,1.0,1.0,1.0,0.127,0.081,0.191
28
- Toto-2.0-1B,TiRex,1.0,1.0,1.0,0.155,0.082,0.239
29
- Toto-2.0-1B,FlowState,0.95,0.85,1.0,0.157,0.056,0.251
30
- Toto-2.0-1B,TabPFN-TS-3,0.95,0.85,1.0,0.128,0.019,0.239
31
- Toto-2.0-1B,TabPFN-TS,1.0,1.0,1.0,0.187,0.136,0.254
32
- Toto-2.0-1B,Moirai-2.0,1.0,1.0,1.0,0.18,0.109,0.265
33
- Toto-2.0-1B,PatchTST,0.95,0.85,1.0,0.181,0.07,0.275
34
- Toto-2.0-1B,Chronos-Bolt,1.0,1.0,1.0,0.22,0.152,0.285
35
- Toto-2.0-1B,Seasonal Naive,1.0,1.0,1.0,0.531,0.419,0.647
36
- Toto-2.0-313m,Toto-2.0-2.5B,0.15,0.0,0.35,-0.022,-0.054,-0.003
37
- Toto-2.0-313m,Toto-2.0-1B,0.3,0.1,0.5,-0.009,-0.023,0.002
38
- Toto-2.0-313m,Toto-2.0-313m,0.5,0.5,0.5,0.0,0.0,0.0
39
- Toto-2.0-313m,Toto-2.0-22m,1.0,1.0,1.0,0.05,0.024,0.082
40
- Toto-2.0-313m,Chronos-2,0.9,0.75,1.0,0.043,-0.025,0.097
41
- Toto-2.0-313m,Toto-1.0,1.0,1.0,1.0,0.106,0.048,0.177
42
- Toto-2.0-313m,Toto-2.0-4m,1.0,1.0,1.0,0.106,0.06,0.159
43
- Toto-2.0-313m,TiRex-2,1.0,1.0,1.0,0.115,0.068,0.169
44
- Toto-2.0-313m,TimesFM-2.5,1.0,1.0,1.0,0.12,0.076,0.18
45
- Toto-2.0-313m,TiRex,1.0,1.0,1.0,0.147,0.08,0.229
46
- Toto-2.0-313m,FlowState,0.95,0.85,1.0,0.149,0.038,0.248
47
- Toto-2.0-313m,TabPFN-TS-3,0.95,0.85,1.0,0.121,-0.004,0.231
48
- Toto-2.0-313m,TabPFN-TS,1.0,1.0,1.0,0.18,0.131,0.245
49
- Toto-2.0-313m,Moirai-2.0,1.0,1.0,1.0,0.173,0.108,0.251
50
- Toto-2.0-313m,PatchTST,0.95,0.85,1.0,0.174,0.052,0.27
51
- Toto-2.0-313m,Chronos-Bolt,1.0,1.0,1.0,0.213,0.151,0.275
52
- Toto-2.0-313m,Seasonal Naive,1.0,1.0,1.0,0.527,0.414,0.642
53
- Toto-2.0-22m,Toto-2.0-2.5B,0.0,0.0,0.0,-0.076,-0.142,-0.03
54
- Toto-2.0-22m,Toto-2.0-1B,0.0,0.0,0.0,-0.062,-0.11,-0.026
55
- Toto-2.0-22m,Toto-2.0-313m,0.0,0.0,0.0,-0.053,-0.089,-0.025
56
- Toto-2.0-22m,Toto-2.0-22m,0.5,0.5,0.5,0.0,0.0,0.0
57
- Toto-2.0-22m,Chronos-2,0.8,0.6,0.95,-0.008,-0.096,0.044
58
- Toto-2.0-22m,Toto-1.0,0.9,0.75,1.0,0.059,0.02,0.114
59
- Toto-2.0-22m,Toto-2.0-4m,1.0,1.0,1.0,0.058,0.034,0.085
60
- Toto-2.0-22m,TiRex-2,0.95,0.85,1.0,0.068,0.042,0.099
61
- Toto-2.0-22m,TimesFM-2.5,0.9,0.75,1.0,0.073,0.036,0.118
62
- Toto-2.0-22m,TiRex,0.95,0.85,1.0,0.102,0.053,0.16
63
- Toto-2.0-22m,FlowState,0.95,0.85,1.0,0.104,-0.035,0.209
64
- Toto-2.0-22m,TabPFN-TS-3,0.95,0.85,1.0,0.074,-0.075,0.178
65
- Toto-2.0-22m,TabPFN-TS,0.9,0.75,1.0,0.137,0.098,0.186
66
- Toto-2.0-22m,Moirai-2.0,1.0,1.0,1.0,0.129,0.081,0.192
67
- Toto-2.0-22m,PatchTST,0.95,0.85,1.0,0.13,-0.014,0.227
68
- Toto-2.0-22m,Chronos-Bolt,1.0,1.0,1.0,0.171,0.122,0.223
69
- Toto-2.0-22m,Seasonal Naive,1.0,1.0,1.0,0.502,0.392,0.613
70
- Chronos-2,Toto-2.0-2.5B,0.1,0.0,0.25,-0.068,-0.124,-0.023
71
- Chronos-2,Toto-2.0-1B,0.1,0.0,0.25,-0.054,-0.115,0.006
72
- Chronos-2,Toto-2.0-313m,0.1,0.0,0.25,-0.045,-0.107,0.024
73
- Chronos-2,Toto-2.0-22m,0.2,0.05,0.4,0.008,-0.046,0.087
74
- Chronos-2,Chronos-2,0.5,0.5,0.5,0.0,0.0,0.0
75
- Chronos-2,Toto-1.0,0.35,0.15,0.55,0.066,-0.014,0.174
76
- Chronos-2,Toto-2.0-4m,0.6,0.35,0.8,0.066,0.005,0.155
77
- Chronos-2,TiRex-2,0.85,0.65,1.0,0.075,0.013,0.169
78
- Chronos-2,TimesFM-2.5,0.75,0.55,0.9,0.08,0.03,0.14
79
- Chronos-2,TiRex,0.8,0.6,0.95,0.109,0.032,0.209
80
- Chronos-2,FlowState,0.8,0.6,0.95,0.111,0.049,0.183
81
- Chronos-2,TabPFN-TS-3,0.85,0.65,1.0,0.081,0.019,0.155
82
- Chronos-2,TabPFN-TS,0.95,0.85,1.0,0.143,0.087,0.216
83
- Chronos-2,Moirai-2.0,1.0,1.0,1.0,0.136,0.059,0.226
84
- Chronos-2,PatchTST,0.85,0.7,1.0,0.137,0.061,0.205
85
- Chronos-2,Chronos-Bolt,1.0,1.0,1.0,0.178,0.103,0.259
86
- Chronos-2,Seasonal Naive,1.0,1.0,1.0,0.506,0.388,0.617
87
- Toto-1.0,Toto-2.0-2.5B,0.0,0.0,0.0,-0.143,-0.27,-0.056
88
- Toto-1.0,Toto-2.0-1B,0.0,0.0,0.0,-0.128,-0.232,-0.054
89
- Toto-1.0,Toto-2.0-313m,0.0,0.0,0.0,-0.118,-0.215,-0.05
90
- Toto-1.0,Toto-2.0-22m,0.1,0.0,0.25,-0.062,-0.128,-0.021
91
- Toto-1.0,Chronos-2,0.65,0.45,0.85,-0.07,-0.211,0.014
92
- Toto-1.0,Toto-1.0,0.5,0.5,0.5,0.0,0.0,0.0
93
- Toto-1.0,Toto-2.0-4m,0.75,0.55,0.95,-0.0,-0.046,0.03
94
- Toto-1.0,TiRex-2,0.8,0.65,0.95,0.01,-0.05,0.046
95
- Toto-1.0,TimesFM-2.5,0.8,0.6,0.95,0.016,-0.049,0.069
96
- Toto-1.0,TiRex,0.75,0.55,0.9,0.046,-0.002,0.1
97
- Toto-1.0,FlowState,0.8,0.6,0.95,0.049,-0.12,0.172
98
- Toto-1.0,TabPFN-TS-3,0.85,0.699,1.0,0.016,-0.189,0.136
99
- Toto-1.0,TabPFN-TS,0.85,0.699,1.0,0.083,0.012,0.143
100
- Toto-1.0,Moirai-2.0,0.9,0.75,1.0,0.075,0.014,0.139
101
- Toto-1.0,PatchTST,0.9,0.75,1.0,0.076,-0.112,0.188
102
- Toto-1.0,Chronos-Bolt,0.95,0.85,1.0,0.12,0.051,0.182
103
- Toto-1.0,Seasonal Naive,1.0,1.0,1.0,0.471,0.37,0.58
104
- Toto-2.0-4m,Toto-2.0-2.5B,0.0,0.0,0.0,-0.143,-0.239,-0.07
105
- Toto-2.0-4m,Toto-2.0-1B,0.0,0.0,0.0,-0.128,-0.206,-0.066
106
- Toto-2.0-4m,Toto-2.0-313m,0.0,0.0,0.0,-0.118,-0.189,-0.063
107
- Toto-2.0-4m,Toto-2.0-22m,0.0,0.0,0.0,-0.062,-0.093,-0.036
108
- Toto-2.0-4m,Chronos-2,0.4,0.2,0.65,-0.07,-0.184,-0.005
109
- Toto-2.0-4m,Toto-1.0,0.25,0.05,0.45,0.0,-0.031,0.044
110
- Toto-2.0-4m,Toto-2.0-4m,0.5,0.5,0.5,0.0,0.0,0.0
111
- Toto-2.0-4m,TiRex-2,0.75,0.55,0.9,0.01,-0.012,0.033
112
- Toto-2.0-4m,TimesFM-2.5,0.7,0.5,0.9,0.016,-0.025,0.049
113
- Toto-2.0-4m,TiRex,0.75,0.55,0.9,0.047,0.016,0.086
114
- Toto-2.0-4m,FlowState,0.8,0.6,0.95,0.049,-0.109,0.156
115
- Toto-2.0-4m,TabPFN-TS-3,0.75,0.55,0.95,0.017,-0.155,0.119
116
- Toto-2.0-4m,TabPFN-TS,0.7,0.5,0.9,0.083,0.042,0.126
117
- Toto-2.0-4m,Moirai-2.0,0.9,0.75,1.0,0.075,0.041,0.122
118
- Toto-2.0-4m,PatchTST,0.9,0.75,1.0,0.076,-0.082,0.173
119
- Toto-2.0-4m,Chronos-Bolt,1.0,1.0,1.0,0.12,0.077,0.168
120
- Toto-2.0-4m,Seasonal Naive,1.0,1.0,1.0,0.471,0.364,0.579
121
- TiRex-2,Toto-2.0-2.5B,0.0,0.0,0.0,-0.155,-0.264,-0.079
122
- TiRex-2,Toto-2.0-1B,0.0,0.0,0.0,-0.14,-0.226,-0.074
123
- TiRex-2,Toto-2.0-313m,0.0,0.0,0.0,-0.13,-0.204,-0.073
124
- TiRex-2,Toto-2.0-22m,0.05,0.0,0.15,-0.073,-0.11,-0.044
125
- TiRex-2,Chronos-2,0.15,0.0,0.35,-0.081,-0.204,-0.013
126
- TiRex-2,Toto-1.0,0.2,0.05,0.35,-0.01,-0.049,0.047
127
- TiRex-2,Toto-2.0-4m,0.25,0.1,0.45,-0.01,-0.034,0.012
128
- TiRex-2,TiRex-2,0.5,0.5,0.5,0.0,0.0,0.0
129
- TiRex-2,TimesFM-2.5,0.65,0.45,0.85,0.006,-0.055,0.053
130
- TiRex-2,TiRex,0.65,0.45,0.85,0.037,0.003,0.082
131
- TiRex-2,FlowState,0.75,0.55,0.95,0.039,-0.135,0.155
132
- TiRex-2,TabPFN-TS-3,0.8,0.65,0.95,0.006,-0.176,0.12
133
- TiRex-2,TabPFN-TS,0.8,0.6,0.95,0.074,0.027,0.122
134
- TiRex-2,Moirai-2.0,0.8,0.6,0.95,0.066,0.026,0.12
135
- TiRex-2,PatchTST,0.95,0.85,1.0,0.066,-0.107,0.169
136
- TiRex-2,Chronos-Bolt,0.95,0.85,1.0,0.111,0.066,0.165
137
- TiRex-2,Seasonal Naive,1.0,1.0,1.0,0.466,0.355,0.579
138
- TimesFM-2.5,Toto-2.0-2.5B,0.05,0.0,0.15,-0.161,-0.255,-0.094
139
- TimesFM-2.5,Toto-2.0-1B,0.0,0.0,0.0,-0.146,-0.236,-0.088
140
- TimesFM-2.5,Toto-2.0-313m,0.0,0.0,0.0,-0.136,-0.22,-0.082
141
- TimesFM-2.5,Toto-2.0-22m,0.1,0.0,0.25,-0.079,-0.134,-0.037
142
- TimesFM-2.5,Chronos-2,0.25,0.1,0.45,-0.088,-0.162,-0.031
143
- TimesFM-2.5,Toto-1.0,0.2,0.05,0.4,-0.016,-0.074,0.047
144
- TimesFM-2.5,Toto-2.0-4m,0.3,0.1,0.5,-0.016,-0.052,0.025
145
- TimesFM-2.5,TiRex-2,0.35,0.15,0.55,-0.006,-0.056,0.052
146
- TimesFM-2.5,TimesFM-2.5,0.5,0.5,0.5,0.0,0.0,0.0
147
- TimesFM-2.5,TiRex,0.6,0.4,0.8,0.031,-0.009,0.083
148
- TimesFM-2.5,FlowState,0.8,0.6,0.95,0.033,-0.09,0.123
149
- TimesFM-2.5,TabPFN-TS-3,0.7,0.5,0.9,0.001,-0.121,0.081
150
- TimesFM-2.5,TabPFN-TS,0.75,0.55,0.95,0.068,0.034,0.105
151
- TimesFM-2.5,Moirai-2.0,0.85,0.65,1.0,0.06,0.024,0.101
152
- TimesFM-2.5,PatchTST,0.8,0.649,0.95,0.061,-0.066,0.141
153
- TimesFM-2.5,Chronos-Bolt,0.9,0.75,1.0,0.106,0.065,0.148
154
- TimesFM-2.5,Seasonal Naive,1.0,1.0,1.0,0.462,0.364,0.568
155
- TiRex,Toto-2.0-2.5B,0.0,0.0,0.0,-0.199,-0.346,-0.095
156
- TiRex,Toto-2.0-1B,0.0,0.0,0.0,-0.183,-0.313,-0.089
157
- TiRex,Toto-2.0-313m,0.0,0.0,0.0,-0.173,-0.296,-0.087
158
- TiRex,Toto-2.0-22m,0.05,0.0,0.15,-0.114,-0.191,-0.056
159
- TiRex,Chronos-2,0.2,0.05,0.4,-0.122,-0.264,-0.033
160
- TiRex,Toto-1.0,0.25,0.1,0.45,-0.049,-0.111,0.002
161
- TiRex,Toto-2.0-4m,0.25,0.1,0.45,-0.049,-0.094,-0.016
162
- TiRex,TiRex-2,0.35,0.15,0.55,-0.038,-0.09,-0.003
163
- TiRex,TimesFM-2.5,0.4,0.2,0.6,-0.032,-0.091,0.009
164
- TiRex,TiRex,0.5,0.5,0.5,0.0,0.0,0.0
165
- TiRex,FlowState,0.6,0.4,0.8,0.002,-0.176,0.116
166
- TiRex,TabPFN-TS-3,0.75,0.55,0.901,-0.031,-0.219,0.065
167
- TiRex,TabPFN-TS,0.7,0.5,0.9,0.038,-0.012,0.083
168
- TiRex,Moirai-2.0,0.75,0.55,0.9,0.03,0.004,0.056
169
- TiRex,PatchTST,0.75,0.55,0.9,0.031,-0.152,0.138
170
- TiRex,Chronos-Bolt,0.85,0.65,1.0,0.077,0.03,0.124
171
- TiRex,Seasonal Naive,1.0,1.0,1.0,0.445,0.35,0.545
172
- FlowState,Toto-2.0-2.5B,0.05,0.0,0.15,-0.201,-0.344,-0.085
173
- FlowState,Toto-2.0-1B,0.05,0.0,0.15,-0.186,-0.335,-0.059
174
- FlowState,Toto-2.0-313m,0.05,0.0,0.15,-0.175,-0.33,-0.04
175
- FlowState,Toto-2.0-22m,0.05,0.0,0.15,-0.116,-0.264,0.034
176
- FlowState,Chronos-2,0.2,0.05,0.4,-0.125,-0.224,-0.051
177
- FlowState,Toto-1.0,0.2,0.05,0.4,-0.051,-0.208,0.107
178
- FlowState,Toto-2.0-4m,0.2,0.05,0.4,-0.051,-0.185,0.099
179
- FlowState,TiRex-2,0.25,0.05,0.45,-0.04,-0.183,0.119
180
- FlowState,TimesFM-2.5,0.2,0.05,0.4,-0.035,-0.141,0.083
181
- FlowState,TiRex,0.4,0.2,0.6,-0.002,-0.131,0.149
182
- FlowState,FlowState,0.5,0.5,0.5,0.0,0.0,0.0
183
- FlowState,TabPFN-TS-3,0.5,0.3,0.7,-0.034,-0.124,0.05
184
- FlowState,TabPFN-TS,0.55,0.35,0.75,0.036,-0.086,0.162
185
- FlowState,Moirai-2.0,0.55,0.35,0.75,0.028,-0.093,0.164
186
- FlowState,PatchTST,0.6,0.4,0.8,0.029,-0.068,0.106
187
- FlowState,Chronos-Bolt,0.7,0.5,0.851,0.075,-0.004,0.187
188
- FlowState,Seasonal Naive,1.0,1.0,1.0,0.444,0.326,0.558
189
- TabPFN-TS-3,Toto-2.0-2.5B,0.05,0.0,0.15,-0.162,-0.325,-0.051
190
- TabPFN-TS-3,Toto-2.0-1B,0.05,0.0,0.15,-0.147,-0.313,-0.019
191
- TabPFN-TS-3,Toto-2.0-313m,0.05,0.0,0.15,-0.137,-0.3,0.004
192
- TabPFN-TS-3,Toto-2.0-22m,0.05,0.0,0.15,-0.08,-0.217,0.07
193
- TabPFN-TS-3,Chronos-2,0.15,0.0,0.35,-0.088,-0.184,-0.019
194
- TabPFN-TS-3,Toto-1.0,0.15,0.0,0.301,-0.017,-0.157,0.159
195
- TabPFN-TS-3,Toto-2.0-4m,0.25,0.05,0.45,-0.017,-0.135,0.134
196
- TabPFN-TS-3,TiRex-2,0.2,0.05,0.35,-0.006,-0.137,0.15
197
- TabPFN-TS-3,TimesFM-2.5,0.3,0.1,0.5,-0.001,-0.088,0.108
198
- TabPFN-TS-3,TiRex,0.25,0.099,0.45,0.03,-0.07,0.179
199
- TabPFN-TS-3,FlowState,0.5,0.3,0.7,0.033,-0.052,0.11
200
- TabPFN-TS-3,TabPFN-TS-3,0.5,0.5,0.5,0.0,0.0,0.0
201
- TabPFN-TS-3,TabPFN-TS,0.65,0.45,0.85,0.068,-0.013,0.181
202
- TabPFN-TS-3,Moirai-2.0,0.5,0.3,0.7,0.06,-0.026,0.187
203
- TabPFN-TS-3,PatchTST,0.5,0.3,0.7,0.06,-0.007,0.116
204
- TabPFN-TS-3,Chronos-Bolt,0.6,0.4,0.8,0.105,-0.001,0.226
205
- TabPFN-TS-3,Seasonal Naive,1.0,1.0,1.0,0.462,0.342,0.578
206
- TabPFN-TS,Toto-2.0-2.5B,0.0,0.0,0.0,-0.246,-0.363,-0.164
207
- TabPFN-TS,Toto-2.0-1B,0.0,0.0,0.0,-0.23,-0.341,-0.157
208
- TabPFN-TS,Toto-2.0-313m,0.0,0.0,0.0,-0.22,-0.324,-0.151
209
- TabPFN-TS,Toto-2.0-22m,0.1,0.0,0.25,-0.158,-0.228,-0.109
210
- TabPFN-TS,Chronos-2,0.05,0.0,0.15,-0.167,-0.275,-0.095
211
- TabPFN-TS,Toto-1.0,0.15,0.0,0.301,-0.091,-0.166,-0.012
212
- TabPFN-TS,Toto-2.0-4m,0.3,0.1,0.5,-0.091,-0.145,-0.043
213
- TabPFN-TS,TiRex-2,0.2,0.05,0.4,-0.08,-0.139,-0.028
214
- TabPFN-TS,TimesFM-2.5,0.25,0.05,0.45,-0.073,-0.118,-0.035
215
- TabPFN-TS,TiRex,0.3,0.1,0.5,-0.04,-0.091,0.012
216
- TabPFN-TS,FlowState,0.45,0.25,0.65,-0.038,-0.193,0.079
217
- TabPFN-TS,TabPFN-TS-3,0.35,0.15,0.55,-0.073,-0.221,0.013
218
- TabPFN-TS,TabPFN-TS,0.5,0.5,0.5,0.0,0.0,0.0
219
- TabPFN-TS,Moirai-2.0,0.45,0.2,0.65,-0.009,-0.056,0.034
220
- TabPFN-TS,PatchTST,0.45,0.25,0.65,-0.008,-0.175,0.096
221
- TabPFN-TS,Chronos-Bolt,0.55,0.35,0.75,0.04,-0.028,0.105
222
- TabPFN-TS,Seasonal Naive,1.0,1.0,1.0,0.423,0.304,0.541
223
- Moirai-2.0,Toto-2.0-2.5B,0.0,0.0,0.0,-0.236,-0.382,-0.129
224
- Moirai-2.0,Toto-2.0-1B,0.0,0.0,0.0,-0.22,-0.36,-0.122
225
- Moirai-2.0,Toto-2.0-313m,0.0,0.0,0.0,-0.209,-0.335,-0.121
226
- Moirai-2.0,Toto-2.0-22m,0.0,0.0,0.0,-0.149,-0.238,-0.089
227
- Moirai-2.0,Chronos-2,0.0,0.0,0.0,-0.157,-0.292,-0.062
228
- Moirai-2.0,Toto-1.0,0.1,0.0,0.25,-0.081,-0.162,-0.014
229
- Moirai-2.0,Toto-2.0-4m,0.1,0.0,0.25,-0.081,-0.139,-0.043
230
- Moirai-2.0,TiRex-2,0.2,0.05,0.4,-0.07,-0.136,-0.027
231
- Moirai-2.0,TimesFM-2.5,0.15,0.0,0.35,-0.064,-0.112,-0.025
232
- Moirai-2.0,TiRex,0.25,0.1,0.45,-0.031,-0.06,-0.004
233
- Moirai-2.0,FlowState,0.45,0.25,0.65,-0.029,-0.197,0.085
234
- Moirai-2.0,TabPFN-TS-3,0.5,0.3,0.7,-0.064,-0.23,0.026
235
- Moirai-2.0,TabPFN-TS,0.55,0.35,0.8,0.008,-0.035,0.053
236
- Moirai-2.0,Moirai-2.0,0.5,0.5,0.5,0.0,0.0,0.0
237
- Moirai-2.0,PatchTST,0.55,0.3,0.75,0.001,-0.174,0.1
238
- Moirai-2.0,Chronos-Bolt,0.75,0.55,0.9,0.048,0.003,0.096
239
- Moirai-2.0,Seasonal Naive,1.0,1.0,1.0,0.428,0.333,0.532
240
- PatchTST,Toto-2.0-2.5B,0.05,0.0,0.15,-0.237,-0.387,-0.105
241
- PatchTST,Toto-2.0-1B,0.05,0.0,0.15,-0.22,-0.379,-0.075
242
- PatchTST,Toto-2.0-313m,0.05,0.0,0.15,-0.21,-0.37,-0.055
243
- PatchTST,Toto-2.0-22m,0.05,0.0,0.15,-0.149,-0.294,0.013
244
- PatchTST,Chronos-2,0.15,0.0,0.3,-0.158,-0.258,-0.065
245
- PatchTST,Toto-1.0,0.1,0.0,0.25,-0.082,-0.232,0.1
246
- PatchTST,Toto-2.0-4m,0.1,0.0,0.25,-0.082,-0.209,0.075
247
- PatchTST,TiRex-2,0.05,0.0,0.15,-0.071,-0.204,0.097
248
- PatchTST,TimesFM-2.5,0.2,0.05,0.351,-0.065,-0.165,0.062
249
- PatchTST,TiRex,0.25,0.1,0.45,-0.032,-0.16,0.132
250
- PatchTST,FlowState,0.4,0.2,0.6,-0.029,-0.118,0.064
251
- PatchTST,TabPFN-TS-3,0.5,0.3,0.7,-0.064,-0.131,0.007
252
- PatchTST,TabPFN-TS,0.55,0.35,0.75,0.008,-0.107,0.149
253
- PatchTST,Moirai-2.0,0.45,0.25,0.7,-0.001,-0.111,0.148
254
- PatchTST,PatchTST,0.5,0.5,0.5,0.0,0.0,0.0
255
- PatchTST,Chronos-Bolt,0.5,0.3,0.7,0.048,-0.064,0.191
256
- PatchTST,Seasonal Naive,0.9,0.775,1.0,0.428,0.289,0.553
257
- Chronos-Bolt,Toto-2.0-2.5B,0.0,0.0,0.0,-0.298,-0.433,-0.184
258
- Chronos-Bolt,Toto-2.0-1B,0.0,0.0,0.0,-0.281,-0.399,-0.179
259
- Chronos-Bolt,Toto-2.0-313m,0.0,0.0,0.0,-0.271,-0.38,-0.178
260
- Chronos-Bolt,Toto-2.0-22m,0.0,0.0,0.0,-0.207,-0.287,-0.139
261
- Chronos-Bolt,Chronos-2,0.0,0.0,0.0,-0.216,-0.349,-0.115
262
- Chronos-Bolt,Toto-1.0,0.05,0.0,0.15,-0.136,-0.223,-0.053
263
- Chronos-Bolt,Toto-2.0-4m,0.0,0.0,0.0,-0.136,-0.201,-0.083
264
- Chronos-Bolt,TiRex-2,0.05,0.0,0.15,-0.125,-0.197,-0.071
265
- Chronos-Bolt,TimesFM-2.5,0.1,0.0,0.25,-0.118,-0.174,-0.069
266
- Chronos-Bolt,TiRex,0.15,0.0,0.35,-0.083,-0.141,-0.031
267
- Chronos-Bolt,FlowState,0.3,0.149,0.5,-0.081,-0.231,0.004
268
- Chronos-Bolt,TabPFN-TS-3,0.4,0.2,0.6,-0.117,-0.293,0.001
269
- Chronos-Bolt,TabPFN-TS,0.45,0.25,0.65,-0.042,-0.117,0.028
270
- Chronos-Bolt,Moirai-2.0,0.25,0.1,0.45,-0.051,-0.106,-0.003
271
- Chronos-Bolt,PatchTST,0.5,0.3,0.7,-0.05,-0.235,0.06
272
- Chronos-Bolt,Chronos-Bolt,0.5,0.5,0.5,0.0,0.0,0.0
273
- Chronos-Bolt,Seasonal Naive,1.0,1.0,1.0,0.399,0.295,0.512
274
- Seasonal Naive,Toto-2.0-2.5B,0.0,0.0,0.0,-1.16,-1.888,-0.726
275
- Seasonal Naive,Toto-2.0-1B,0.0,0.0,0.0,-1.132,-1.83,-0.721
276
- Seasonal Naive,Toto-2.0-313m,0.0,0.0,0.0,-1.114,-1.794,-0.707
277
- Seasonal Naive,Toto-2.0-22m,0.0,0.0,0.0,-1.008,-1.587,-0.645
278
- Seasonal Naive,Chronos-2,0.0,0.0,0.0,-1.023,-1.609,-0.634
279
- Seasonal Naive,Toto-1.0,0.0,0.0,0.0,-0.89,-1.38,-0.588
280
- Seasonal Naive,Toto-2.0-4m,0.0,0.0,0.0,-0.89,-1.375,-0.572
281
- Seasonal Naive,TiRex-2,0.0,0.0,0.0,-0.871,-1.377,-0.55
282
- Seasonal Naive,TimesFM-2.5,0.0,0.0,0.0,-0.86,-1.313,-0.572
283
- Seasonal Naive,TiRex,0.0,0.0,0.0,-0.802,-1.198,-0.539
284
- Seasonal Naive,FlowState,0.0,0.0,0.0,-0.798,-1.26,-0.483
285
- Seasonal Naive,TabPFN-TS-3,0.0,0.0,0.0,-0.859,-1.369,-0.521
286
- Seasonal Naive,TabPFN-TS,0.0,0.0,0.0,-0.733,-1.18,-0.436
287
- Seasonal Naive,Moirai-2.0,0.0,0.0,0.0,-0.748,-1.138,-0.499
288
- Seasonal Naive,PatchTST,0.1,0.0,0.225,-0.747,-1.237,-0.406
289
- Seasonal Naive,Chronos-Bolt,0.0,0.0,0.0,-0.664,-1.049,-0.418
290
- Seasonal Naive,Seasonal Naive,0.5,0.5,0.5,0.0,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_cloud/pairwise_WQL.csv DELETED
@@ -1,290 +0,0 @@
1
- model_1,model_2,win_rate,win_rate_lower,win_rate_upper,skill_score,skill_score_lower,skill_score_upper
2
- Toto-2.0-2.5B,Toto-2.0-2.5B,0.5,0.5,0.5,0.0,0.0,0.0
3
- Toto-2.0-2.5B,Toto-2.0-1B,0.75,0.55,0.9,0.009,-0.004,0.026
4
- Toto-2.0-2.5B,Toto-2.0-313m,0.9,0.75,1.0,0.02,-0.002,0.053
5
- Toto-2.0-2.5B,Toto-2.0-22m,1.0,1.0,1.0,0.068,0.033,0.117
6
- Toto-2.0-2.5B,Chronos-2,0.95,0.85,1.0,0.063,0.029,0.097
7
- Toto-2.0-2.5B,Toto-1.0,1.0,1.0,1.0,0.129,0.058,0.225
8
- Toto-2.0-2.5B,Toto-2.0-4m,1.0,1.0,1.0,0.13,0.069,0.205
9
- Toto-2.0-2.5B,TiRex-2,1.0,1.0,1.0,0.14,0.077,0.222
10
- Toto-2.0-2.5B,TimesFM-2.5,1.0,1.0,1.0,0.146,0.095,0.204
11
- Toto-2.0-2.5B,TiRex,1.0,1.0,1.0,0.169,0.091,0.263
12
- Toto-2.0-2.5B,TabPFN-TS-3,0.95,0.85,1.0,0.131,0.047,0.222
13
- Toto-2.0-2.5B,FlowState,0.95,0.85,1.0,0.171,0.084,0.255
14
- Toto-2.0-2.5B,Moirai-2.0,1.0,1.0,1.0,0.204,0.129,0.288
15
- Toto-2.0-2.5B,PatchTST,0.95,0.85,1.0,0.231,0.124,0.326
16
- Toto-2.0-2.5B,TFT,1.0,1.0,1.0,0.303,0.177,0.432
17
- Toto-2.0-2.5B,Chronos-Bolt,1.0,1.0,1.0,0.26,0.189,0.332
18
- Toto-2.0-2.5B,Seasonal Naive,1.0,1.0,1.0,0.69,0.609,0.766
19
- Toto-2.0-1B,Toto-2.0-2.5B,0.25,0.1,0.45,-0.009,-0.027,0.004
20
- Toto-2.0-1B,Toto-2.0-1B,0.5,0.5,0.5,0.0,0.0,0.0
21
- Toto-2.0-1B,Toto-2.0-313m,0.8,0.6,0.95,0.011,-0.002,0.03
22
- Toto-2.0-1B,Toto-2.0-22m,1.0,1.0,1.0,0.059,0.03,0.097
23
- Toto-2.0-1B,Chronos-2,0.95,0.85,1.0,0.055,0.005,0.095
24
- Toto-2.0-1B,Toto-1.0,1.0,1.0,1.0,0.121,0.056,0.205
25
- Toto-2.0-1B,Toto-2.0-4m,1.0,1.0,1.0,0.122,0.068,0.187
26
- Toto-2.0-1B,TiRex-2,1.0,1.0,1.0,0.132,0.076,0.205
27
- Toto-2.0-1B,TimesFM-2.5,1.0,1.0,1.0,0.138,0.091,0.191
28
- Toto-2.0-1B,TiRex,1.0,1.0,1.0,0.161,0.088,0.248
29
- Toto-2.0-1B,TabPFN-TS-3,0.95,0.85,1.0,0.123,0.025,0.223
30
- Toto-2.0-1B,FlowState,0.95,0.85,1.0,0.163,0.068,0.254
31
- Toto-2.0-1B,Moirai-2.0,1.0,1.0,1.0,0.197,0.125,0.279
32
- Toto-2.0-1B,PatchTST,0.95,0.85,1.0,0.224,0.107,0.322
33
- Toto-2.0-1B,TFT,1.0,1.0,1.0,0.297,0.176,0.423
34
- Toto-2.0-1B,Chronos-Bolt,1.0,1.0,1.0,0.253,0.186,0.32
35
- Toto-2.0-1B,Seasonal Naive,1.0,1.0,1.0,0.688,0.607,0.763
36
- Toto-2.0-313m,Toto-2.0-2.5B,0.1,0.0,0.25,-0.02,-0.056,0.002
37
- Toto-2.0-313m,Toto-2.0-1B,0.2,0.05,0.4,-0.011,-0.03,0.002
38
- Toto-2.0-313m,Toto-2.0-313m,0.5,0.5,0.5,0.0,0.0,0.0
39
- Toto-2.0-313m,Toto-2.0-22m,1.0,1.0,1.0,0.049,0.028,0.073
40
- Toto-2.0-313m,Chronos-2,0.9,0.75,1.0,0.044,-0.025,0.093
41
- Toto-2.0-313m,Toto-1.0,1.0,1.0,1.0,0.111,0.054,0.181
42
- Toto-2.0-313m,Toto-2.0-4m,1.0,1.0,1.0,0.112,0.065,0.165
43
- Toto-2.0-313m,TiRex-2,1.0,1.0,1.0,0.123,0.074,0.182
44
- Toto-2.0-313m,TimesFM-2.5,1.0,1.0,1.0,0.128,0.087,0.182
45
- Toto-2.0-313m,TiRex,1.0,1.0,1.0,0.152,0.086,0.227
46
- Toto-2.0-313m,TabPFN-TS-3,0.95,0.85,1.0,0.114,-0.005,0.22
47
- Toto-2.0-313m,FlowState,0.95,0.85,1.0,0.154,0.045,0.251
48
- Toto-2.0-313m,Moirai-2.0,1.0,1.0,1.0,0.188,0.124,0.259
49
- Toto-2.0-313m,PatchTST,0.95,0.85,1.0,0.216,0.083,0.318
50
- Toto-2.0-313m,TFT,1.0,1.0,1.0,0.289,0.173,0.418
51
- Toto-2.0-313m,Chronos-Bolt,1.0,1.0,1.0,0.245,0.185,0.304
52
- Toto-2.0-313m,Seasonal Naive,1.0,1.0,1.0,0.684,0.602,0.763
53
- Toto-2.0-22m,Toto-2.0-2.5B,0.0,0.0,0.0,-0.073,-0.133,-0.034
54
- Toto-2.0-22m,Toto-2.0-1B,0.0,0.0,0.0,-0.063,-0.107,-0.031
55
- Toto-2.0-22m,Toto-2.0-313m,0.0,0.0,0.0,-0.052,-0.079,-0.029
56
- Toto-2.0-22m,Toto-2.0-22m,0.5,0.5,0.5,0.0,0.0,0.0
57
- Toto-2.0-22m,Chronos-2,0.8,0.6,0.95,-0.005,-0.088,0.044
58
- Toto-2.0-22m,Toto-1.0,0.9,0.75,1.0,0.065,0.023,0.123
59
- Toto-2.0-22m,Toto-2.0-4m,1.0,1.0,1.0,0.066,0.036,0.1
60
- Toto-2.0-22m,TiRex-2,1.0,1.0,1.0,0.077,0.044,0.12
61
- Toto-2.0-22m,TimesFM-2.5,0.95,0.85,1.0,0.084,0.052,0.121
62
- Toto-2.0-22m,TiRex,0.95,0.85,1.0,0.108,0.057,0.168
63
- Toto-2.0-22m,TabPFN-TS-3,0.9,0.75,1.0,0.068,-0.074,0.168
64
- Toto-2.0-22m,FlowState,0.9,0.75,1.0,0.111,-0.022,0.213
65
- Toto-2.0-22m,Moirai-2.0,1.0,1.0,1.0,0.146,0.095,0.205
66
- Toto-2.0-22m,PatchTST,0.95,0.85,1.0,0.176,0.029,0.281
67
- Toto-2.0-22m,TFT,1.0,1.0,1.0,0.253,0.14,0.374
68
- Toto-2.0-22m,Chronos-Bolt,1.0,1.0,1.0,0.206,0.157,0.257
69
- Toto-2.0-22m,Seasonal Naive,1.0,1.0,1.0,0.668,0.584,0.745
70
- Chronos-2,Toto-2.0-2.5B,0.05,0.0,0.15,-0.068,-0.107,-0.03
71
- Chronos-2,Toto-2.0-1B,0.05,0.0,0.15,-0.058,-0.105,-0.005
72
- Chronos-2,Toto-2.0-313m,0.1,0.0,0.25,-0.046,-0.103,0.024
73
- Chronos-2,Toto-2.0-22m,0.2,0.05,0.4,0.005,-0.046,0.081
74
- Chronos-2,Chronos-2,0.5,0.5,0.5,0.0,0.0,0.0
75
- Chronos-2,Toto-1.0,0.35,0.15,0.55,0.07,-0.014,0.185
76
- Chronos-2,Toto-2.0-4m,0.6,0.35,0.8,0.071,0.004,0.171
77
- Chronos-2,TiRex-2,0.8,0.6,0.95,0.082,0.016,0.185
78
- Chronos-2,TimesFM-2.5,0.75,0.55,0.9,0.088,0.033,0.155
79
- Chronos-2,TiRex,0.85,0.7,1.0,0.113,0.032,0.222
80
- Chronos-2,TabPFN-TS-3,0.9,0.75,1.0,0.072,0.011,0.147
81
- Chronos-2,FlowState,0.85,0.65,1.0,0.115,0.05,0.188
82
- Chronos-2,Moirai-2.0,1.0,1.0,1.0,0.151,0.066,0.248
83
- Chronos-2,PatchTST,0.85,0.7,1.0,0.18,0.08,0.27
84
- Chronos-2,TFT,0.95,0.85,1.0,0.256,0.118,0.395
85
- Chronos-2,Chronos-Bolt,1.0,1.0,1.0,0.21,0.134,0.3
86
- Chronos-2,Seasonal Naive,1.0,1.0,1.0,0.669,0.582,0.746
87
- Toto-1.0,Toto-2.0-2.5B,0.0,0.0,0.0,-0.148,-0.291,-0.061
88
- Toto-1.0,Toto-2.0-1B,0.0,0.0,0.0,-0.137,-0.257,-0.06
89
- Toto-1.0,Toto-2.0-313m,0.0,0.0,0.0,-0.125,-0.222,-0.057
90
- Toto-1.0,Toto-2.0-22m,0.1,0.0,0.25,-0.07,-0.141,-0.024
91
- Toto-1.0,Chronos-2,0.65,0.45,0.85,-0.075,-0.227,0.014
92
- Toto-1.0,Toto-1.0,0.5,0.5,0.5,0.0,0.0,0.0
93
- Toto-1.0,Toto-2.0-4m,0.6,0.4,0.8,0.001,-0.04,0.028
94
- Toto-1.0,TiRex-2,0.8,0.65,0.95,0.013,-0.041,0.047
95
- Toto-1.0,TimesFM-2.5,0.75,0.55,0.95,0.02,-0.047,0.073
96
- Toto-1.0,TiRex,0.75,0.55,0.9,0.046,0.0,0.095
97
- Toto-1.0,TabPFN-TS-3,0.8,0.6,0.95,0.003,-0.211,0.127
98
- Toto-1.0,FlowState,0.75,0.55,0.9,0.049,-0.131,0.178
99
- Toto-1.0,Moirai-2.0,0.85,0.7,1.0,0.087,0.029,0.145
100
- Toto-1.0,PatchTST,0.9,0.75,1.0,0.118,-0.078,0.246
101
- Toto-1.0,TFT,1.0,1.0,1.0,0.2,0.108,0.294
102
- Toto-1.0,Chronos-Bolt,0.95,0.85,1.0,0.151,0.089,0.21
103
- Toto-1.0,Seasonal Naive,1.0,1.0,1.0,0.645,0.563,0.725
104
- Toto-2.0-4m,Toto-2.0-2.5B,0.0,0.0,0.0,-0.149,-0.258,-0.075
105
- Toto-2.0-4m,Toto-2.0-1B,0.0,0.0,0.0,-0.139,-0.23,-0.073
106
- Toto-2.0-4m,Toto-2.0-313m,0.0,0.0,0.0,-0.126,-0.198,-0.069
107
- Toto-2.0-4m,Toto-2.0-22m,0.0,0.0,0.0,-0.071,-0.112,-0.038
108
- Toto-2.0-4m,Chronos-2,0.4,0.2,0.65,-0.076,-0.207,-0.004
109
- Toto-2.0-4m,Toto-1.0,0.4,0.2,0.6,-0.001,-0.029,0.038
110
- Toto-2.0-4m,Toto-2.0-4m,0.5,0.5,0.5,0.0,0.0,0.0
111
- Toto-2.0-4m,TiRex-2,0.65,0.45,0.85,0.012,-0.009,0.034
112
- Toto-2.0-4m,TimesFM-2.5,0.6,0.4,0.8,0.019,-0.028,0.056
113
- Toto-2.0-4m,TiRex,0.8,0.649,0.95,0.045,0.016,0.082
114
- Toto-2.0-4m,TabPFN-TS-3,0.75,0.55,0.95,0.002,-0.182,0.109
115
- Toto-2.0-4m,FlowState,0.85,0.7,1.0,0.048,-0.128,0.162
116
- Toto-2.0-4m,Moirai-2.0,0.9,0.75,1.0,0.086,0.049,0.128
117
- Toto-2.0-4m,PatchTST,0.95,0.85,1.0,0.117,-0.066,0.232
118
- Toto-2.0-4m,TFT,0.9,0.75,1.0,0.2,0.09,0.31
119
- Toto-2.0-4m,Chronos-Bolt,1.0,1.0,1.0,0.15,0.107,0.197
120
- Toto-2.0-4m,Seasonal Naive,1.0,1.0,1.0,0.644,0.559,0.727
121
- TiRex-2,Toto-2.0-2.5B,0.0,0.0,0.0,-0.163,-0.286,-0.084
122
- TiRex-2,Toto-2.0-1B,0.0,0.0,0.0,-0.152,-0.258,-0.082
123
- TiRex-2,Toto-2.0-313m,0.0,0.0,0.0,-0.14,-0.222,-0.08
124
- TiRex-2,Toto-2.0-22m,0.0,0.0,0.0,-0.084,-0.136,-0.046
125
- TiRex-2,Chronos-2,0.2,0.05,0.4,-0.089,-0.227,-0.017
126
- TiRex-2,Toto-1.0,0.2,0.05,0.35,-0.013,-0.049,0.039
127
- TiRex-2,Toto-2.0-4m,0.35,0.15,0.55,-0.012,-0.035,0.009
128
- TiRex-2,TiRex-2,0.5,0.5,0.5,0.0,0.0,0.0
129
- TiRex-2,TimesFM-2.5,0.65,0.45,0.85,0.007,-0.056,0.053
130
- TiRex-2,TiRex,0.65,0.45,0.85,0.034,0.004,0.075
131
- TiRex-2,TabPFN-TS-3,0.75,0.6,0.9,-0.01,-0.207,0.11
132
- TiRex-2,FlowState,0.75,0.55,0.95,0.036,-0.151,0.155
133
- TiRex-2,Moirai-2.0,0.95,0.85,1.0,0.075,0.041,0.122
134
- TiRex-2,PatchTST,0.9,0.75,1.0,0.106,-0.096,0.232
135
- TiRex-2,TFT,0.85,0.7,0.95,0.19,0.073,0.312
136
- TiRex-2,Chronos-Bolt,1.0,1.0,1.0,0.14,0.099,0.185
137
- TiRex-2,Seasonal Naive,1.0,1.0,1.0,0.64,0.55,0.728
138
- TimesFM-2.5,Toto-2.0-2.5B,0.0,0.0,0.0,-0.171,-0.256,-0.105
139
- TimesFM-2.5,Toto-2.0-1B,0.0,0.0,0.0,-0.16,-0.236,-0.1
140
- TimesFM-2.5,Toto-2.0-313m,0.0,0.0,0.0,-0.147,-0.223,-0.095
141
- TimesFM-2.5,Toto-2.0-22m,0.05,0.0,0.15,-0.091,-0.138,-0.055
142
- TimesFM-2.5,Chronos-2,0.25,0.1,0.45,-0.097,-0.183,-0.034
143
- TimesFM-2.5,Toto-1.0,0.25,0.05,0.45,-0.02,-0.079,0.045
144
- TimesFM-2.5,Toto-2.0-4m,0.4,0.2,0.6,-0.019,-0.059,0.027
145
- TimesFM-2.5,TiRex-2,0.35,0.15,0.55,-0.007,-0.056,0.053
146
- TimesFM-2.5,TimesFM-2.5,0.5,0.5,0.5,0.0,0.0,0.0
147
- TimesFM-2.5,TiRex,0.6,0.4,0.8,0.027,-0.018,0.086
148
- TimesFM-2.5,TabPFN-TS-3,0.6,0.4,0.8,-0.017,-0.149,0.071
149
- TimesFM-2.5,FlowState,0.7,0.5,0.9,0.03,-0.104,0.121
150
- TimesFM-2.5,Moirai-2.0,0.85,0.65,1.0,0.069,0.028,0.116
151
- TimesFM-2.5,PatchTST,0.85,0.7,1.0,0.1,-0.044,0.208
152
- TimesFM-2.5,TFT,0.8,0.6,0.95,0.184,0.06,0.307
153
- TimesFM-2.5,Chronos-Bolt,0.9,0.75,1.0,0.134,0.092,0.179
154
- TimesFM-2.5,Seasonal Naive,1.0,1.0,1.0,0.638,0.557,0.714
155
- TiRex,Toto-2.0-2.5B,0.0,0.0,0.0,-0.203,-0.356,-0.1
156
- TiRex,Toto-2.0-1B,0.0,0.0,0.0,-0.192,-0.33,-0.096
157
- TiRex,Toto-2.0-313m,0.0,0.0,0.0,-0.179,-0.294,-0.094
158
- TiRex,Toto-2.0-22m,0.05,0.0,0.15,-0.122,-0.202,-0.061
159
- TiRex,Chronos-2,0.15,0.0,0.3,-0.127,-0.285,-0.033
160
- TiRex,Toto-1.0,0.25,0.1,0.45,-0.048,-0.105,-0.0
161
- TiRex,Toto-2.0-4m,0.2,0.05,0.351,-0.047,-0.089,-0.016
162
- TiRex,TiRex-2,0.35,0.15,0.55,-0.035,-0.081,-0.004
163
- TiRex,TimesFM-2.5,0.4,0.2,0.6,-0.028,-0.095,0.018
164
- TiRex,TiRex,0.5,0.5,0.5,0.0,0.0,0.0
165
- TiRex,TabPFN-TS-3,0.7,0.5,0.9,-0.045,-0.247,0.06
166
- TiRex,FlowState,0.7,0.5,0.9,0.003,-0.19,0.122
167
- TiRex,Moirai-2.0,0.9,0.75,1.0,0.043,0.019,0.07
168
- TiRex,PatchTST,0.8,0.6,0.95,0.075,-0.133,0.211
169
- TiRex,TFT,0.85,0.7,0.95,0.162,0.034,0.285
170
- TiRex,Chronos-Bolt,0.9,0.75,1.0,0.11,0.064,0.155
171
- TiRex,Seasonal Naive,1.0,1.0,1.0,0.627,0.54,0.71
172
- TabPFN-TS-3,Toto-2.0-2.5B,0.05,0.0,0.15,-0.151,-0.285,-0.049
173
- TabPFN-TS-3,Toto-2.0-1B,0.05,0.0,0.15,-0.141,-0.286,-0.025
174
- TabPFN-TS-3,Toto-2.0-313m,0.05,0.0,0.15,-0.128,-0.282,0.005
175
- TabPFN-TS-3,Toto-2.0-22m,0.1,0.0,0.25,-0.073,-0.202,0.069
176
- TabPFN-TS-3,Chronos-2,0.1,0.0,0.25,-0.078,-0.172,-0.012
177
- TabPFN-TS-3,Toto-1.0,0.2,0.05,0.4,-0.003,-0.146,0.175
178
- TabPFN-TS-3,Toto-2.0-4m,0.25,0.05,0.45,-0.002,-0.123,0.154
179
- TabPFN-TS-3,TiRex-2,0.25,0.1,0.4,0.01,-0.124,0.172
180
- TabPFN-TS-3,TimesFM-2.5,0.4,0.2,0.6,0.017,-0.077,0.13
181
- TabPFN-TS-3,TiRex,0.3,0.1,0.5,0.043,-0.064,0.198
182
- TabPFN-TS-3,TabPFN-TS-3,0.5,0.5,0.5,0.0,0.0,0.0
183
- TabPFN-TS-3,FlowState,0.5,0.3,0.7,0.046,-0.042,0.123
184
- TabPFN-TS-3,Moirai-2.0,0.6,0.399,0.8,0.084,-0.013,0.224
185
- TabPFN-TS-3,PatchTST,0.7,0.5,0.9,0.115,0.011,0.208
186
- TabPFN-TS-3,TFT,0.7,0.5,0.9,0.198,0.019,0.365
187
- TabPFN-TS-3,Chronos-Bolt,0.85,0.65,1.0,0.148,0.036,0.276
188
- TabPFN-TS-3,Seasonal Naive,1.0,1.0,1.0,0.644,0.549,0.724
189
- FlowState,Toto-2.0-2.5B,0.05,0.0,0.15,-0.206,-0.343,-0.092
190
- FlowState,Toto-2.0-1B,0.05,0.0,0.15,-0.195,-0.34,-0.073
191
- FlowState,Toto-2.0-313m,0.05,0.0,0.15,-0.182,-0.334,-0.047
192
- FlowState,Toto-2.0-22m,0.1,0.0,0.25,-0.124,-0.271,0.021
193
- FlowState,Chronos-2,0.15,0.0,0.35,-0.13,-0.232,-0.053
194
- FlowState,Toto-1.0,0.25,0.1,0.45,-0.051,-0.217,0.116
195
- FlowState,Toto-2.0-4m,0.15,0.0,0.3,-0.05,-0.194,0.113
196
- FlowState,TiRex-2,0.25,0.05,0.45,-0.037,-0.184,0.131
197
- FlowState,TimesFM-2.5,0.3,0.1,0.5,-0.03,-0.137,0.094
198
- FlowState,TiRex,0.3,0.1,0.5,-0.003,-0.139,0.159
199
- FlowState,TabPFN-TS-3,0.5,0.3,0.7,-0.048,-0.141,0.04
200
- FlowState,FlowState,0.5,0.5,0.5,0.0,0.0,0.0
201
- FlowState,Moirai-2.0,0.5,0.25,0.7,0.04,-0.089,0.189
202
- FlowState,PatchTST,0.6,0.4,0.8,0.073,-0.056,0.185
203
- FlowState,TFT,0.65,0.45,0.85,0.16,-0.028,0.323
204
- FlowState,Chronos-Bolt,0.8,0.649,0.95,0.107,0.023,0.228
205
- FlowState,Seasonal Naive,1.0,1.0,1.0,0.626,0.538,0.704
206
- Moirai-2.0,Toto-2.0-2.5B,0.0,0.0,0.0,-0.257,-0.404,-0.148
207
- Moirai-2.0,Toto-2.0-1B,0.0,0.0,0.0,-0.245,-0.387,-0.143
208
- Moirai-2.0,Toto-2.0-313m,0.0,0.0,0.0,-0.232,-0.35,-0.142
209
- Moirai-2.0,Toto-2.0-22m,0.0,0.0,0.0,-0.171,-0.257,-0.105
210
- Moirai-2.0,Chronos-2,0.0,0.0,0.0,-0.177,-0.33,-0.071
211
- Moirai-2.0,Toto-1.0,0.15,0.0,0.3,-0.095,-0.17,-0.03
212
- Moirai-2.0,Toto-2.0-4m,0.1,0.0,0.25,-0.094,-0.147,-0.052
213
- Moirai-2.0,TiRex-2,0.05,0.0,0.15,-0.081,-0.139,-0.043
214
- Moirai-2.0,TimesFM-2.5,0.15,0.0,0.35,-0.074,-0.131,-0.029
215
- Moirai-2.0,TiRex,0.1,0.0,0.25,-0.044,-0.075,-0.02
216
- Moirai-2.0,TabPFN-TS-3,0.4,0.2,0.601,-0.092,-0.288,0.013
217
- Moirai-2.0,FlowState,0.5,0.3,0.75,-0.042,-0.233,0.082
218
- Moirai-2.0,Moirai-2.0,0.5,0.5,0.5,0.0,0.0,0.0
219
- Moirai-2.0,PatchTST,0.6,0.4,0.8,0.034,-0.175,0.172
220
- Moirai-2.0,TFT,0.7,0.5,0.9,0.124,-0.012,0.26
221
- Moirai-2.0,Chronos-Bolt,0.85,0.699,0.975,0.07,0.023,0.118
222
- Moirai-2.0,Seasonal Naive,1.0,1.0,1.0,0.611,0.523,0.693
223
- PatchTST,Toto-2.0-2.5B,0.05,0.0,0.15,-0.301,-0.483,-0.142
224
- PatchTST,Toto-2.0-1B,0.05,0.0,0.15,-0.289,-0.474,-0.119
225
- PatchTST,Toto-2.0-313m,0.05,0.0,0.15,-0.275,-0.467,-0.091
226
- PatchTST,Toto-2.0-22m,0.05,0.0,0.15,-0.213,-0.392,-0.029
227
- PatchTST,Chronos-2,0.15,0.0,0.3,-0.219,-0.369,-0.087
228
- PatchTST,Toto-1.0,0.1,0.0,0.25,-0.134,-0.327,0.072
229
- PatchTST,Toto-2.0-4m,0.05,0.0,0.15,-0.133,-0.303,0.062
230
- PatchTST,TiRex-2,0.1,0.0,0.25,-0.119,-0.302,0.088
231
- PatchTST,TimesFM-2.5,0.15,0.0,0.3,-0.112,-0.262,0.042
232
- PatchTST,TiRex,0.2,0.05,0.4,-0.081,-0.267,0.118
233
- PatchTST,TabPFN-TS-3,0.3,0.1,0.5,-0.13,-0.262,-0.011
234
- PatchTST,FlowState,0.4,0.2,0.6,-0.079,-0.227,0.053
235
- PatchTST,Moirai-2.0,0.4,0.2,0.6,-0.035,-0.208,0.149
236
- PatchTST,PatchTST,0.5,0.5,0.5,0.0,0.0,0.0
237
- PatchTST,TFT,0.425,0.225,0.625,0.093,-0.057,0.271
238
- PatchTST,Chronos-Bolt,0.6,0.4,0.8,0.037,-0.124,0.209
239
- PatchTST,Seasonal Naive,0.9,0.75,1.0,0.597,0.477,0.698
240
- TFT,Toto-2.0-2.5B,0.0,0.0,0.0,-0.435,-0.762,-0.215
241
- TFT,Toto-2.0-1B,0.0,0.0,0.0,-0.422,-0.733,-0.214
242
- TFT,Toto-2.0-313m,0.0,0.0,0.0,-0.407,-0.717,-0.209
243
- TFT,Toto-2.0-22m,0.0,0.0,0.0,-0.338,-0.598,-0.163
244
- TFT,Chronos-2,0.05,0.0,0.15,-0.344,-0.652,-0.133
245
- TFT,Toto-1.0,0.0,0.0,0.0,-0.251,-0.415,-0.121
246
- TFT,Toto-2.0-4m,0.1,0.0,0.25,-0.249,-0.449,-0.099
247
- TFT,TiRex-2,0.15,0.05,0.3,-0.234,-0.453,-0.079
248
- TFT,TimesFM-2.5,0.2,0.05,0.4,-0.226,-0.442,-0.064
249
- TFT,TiRex,0.15,0.05,0.3,-0.193,-0.399,-0.035
250
- TFT,TabPFN-TS-3,0.3,0.1,0.5,-0.247,-0.574,-0.019
251
- TFT,FlowState,0.35,0.15,0.55,-0.19,-0.477,0.027
252
- TFT,Moirai-2.0,0.3,0.1,0.5,-0.142,-0.351,0.012
253
- TFT,PatchTST,0.575,0.375,0.775,-0.103,-0.372,0.054
254
- TFT,TFT,0.5,0.5,0.5,0.0,0.0,0.0
255
- TFT,Chronos-Bolt,0.5,0.3,0.7,-0.062,-0.262,0.087
256
- TFT,Seasonal Naive,0.9,0.75,1.0,0.556,0.443,0.658
257
- Chronos-Bolt,Toto-2.0-2.5B,0.0,0.0,0.0,-0.351,-0.498,-0.233
258
- Chronos-Bolt,Toto-2.0-1B,0.0,0.0,0.0,-0.339,-0.471,-0.228
259
- Chronos-Bolt,Toto-2.0-313m,0.0,0.0,0.0,-0.325,-0.437,-0.227
260
- Chronos-Bolt,Toto-2.0-22m,0.0,0.0,0.0,-0.26,-0.345,-0.186
261
- Chronos-Bolt,Chronos-2,0.0,0.0,0.0,-0.266,-0.429,-0.154
262
- Chronos-Bolt,Toto-1.0,0.05,0.0,0.15,-0.177,-0.267,-0.098
263
- Chronos-Bolt,Toto-2.0-4m,0.0,0.0,0.0,-0.176,-0.246,-0.12
264
- Chronos-Bolt,TiRex-2,0.0,0.0,0.0,-0.162,-0.227,-0.11
265
- Chronos-Bolt,TimesFM-2.5,0.1,0.0,0.25,-0.154,-0.218,-0.101
266
- Chronos-Bolt,TiRex,0.1,0.0,0.25,-0.123,-0.183,-0.069
267
- Chronos-Bolt,TabPFN-TS-3,0.15,0.0,0.35,-0.174,-0.382,-0.037
268
- Chronos-Bolt,FlowState,0.2,0.05,0.351,-0.12,-0.295,-0.023
269
- Chronos-Bolt,Moirai-2.0,0.15,0.025,0.301,-0.075,-0.134,-0.024
270
- Chronos-Bolt,PatchTST,0.4,0.2,0.6,-0.039,-0.264,0.11
271
- Chronos-Bolt,TFT,0.5,0.3,0.7,0.059,-0.096,0.207
272
- Chronos-Bolt,Chronos-Bolt,0.5,0.5,0.5,0.0,0.0,0.0
273
- Chronos-Bolt,Seasonal Naive,1.0,1.0,1.0,0.582,0.486,0.675
274
- Seasonal Naive,Toto-2.0-2.5B,0.0,0.0,0.0,-2.229,-3.277,-1.556
275
- Seasonal Naive,Toto-2.0-1B,0.0,0.0,0.0,-2.201,-3.228,-1.546
276
- Seasonal Naive,Toto-2.0-313m,0.0,0.0,0.0,-2.166,-3.211,-1.516
277
- Seasonal Naive,Toto-2.0-22m,0.0,0.0,0.0,-2.011,-2.926,-1.406
278
- Seasonal Naive,Chronos-2,0.0,0.0,0.0,-2.025,-2.936,-1.394
279
- Seasonal Naive,Toto-1.0,0.0,0.0,0.0,-1.814,-2.639,-1.287
280
- Seasonal Naive,Toto-2.0-4m,0.0,0.0,0.0,-1.811,-2.664,-1.269
281
- Seasonal Naive,TiRex-2,0.0,0.0,0.0,-1.778,-2.67,-1.221
282
- Seasonal Naive,TimesFM-2.5,0.0,0.0,0.0,-1.759,-2.495,-1.259
283
- Seasonal Naive,TiRex,0.0,0.0,0.0,-1.684,-2.448,-1.175
284
- Seasonal Naive,TabPFN-TS-3,0.0,0.0,0.0,-1.806,-2.622,-1.215
285
- Seasonal Naive,FlowState,0.0,0.0,0.0,-1.677,-2.381,-1.163
286
- Seasonal Naive,Moirai-2.0,0.0,0.0,0.0,-1.57,-2.259,-1.095
287
- Seasonal Naive,PatchTST,0.1,0.0,0.25,-1.482,-2.307,-0.914
288
- Seasonal Naive,TFT,0.1,0.0,0.25,-1.25,-1.926,-0.795
289
- Seasonal Naive,Chronos-Bolt,0.0,0.0,0.0,-1.39,-2.073,-0.945
290
- Seasonal Naive,Seasonal Naive,0.5,0.5,0.5,0.0,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_econ/leaderboard_MASE.csv DELETED
@@ -1,29 +0,0 @@
1
- model_name,win_rate,skill_score,median_training_time_s_per100,median_inference_time_s_per100,training_corpus_overlap,num_failures
2
- TiRex-2,89.50617283950616,40.553930524399625,0.0,0.11294837920086495,0.0,0.0
3
- Stat. Ensemble,79.320987654321,38.47702197421158,0.0,73.43481351955408,0.0,0.0
4
- Toto-2.0-22m,74.69135802469134,37.883510512986405,0.0,0.2300832338301921,0.0,0.0
5
- Toto-2.0-1B,72.83950617283949,37.647796213911036,0.0,2.4167769806179775,0.0,0.0
6
- Toto-2.0-313m,70.06172839506173,37.637104246897856,0.0,0.9865880503225806,0.0,0.0
7
- Toto-2.0-2.5B,69.7530864197531,37.649421436010044,0.0,5.236902611304615,0.0,0.0
8
- TiRex,67.59259259259261,36.87592044073875,0.0,0.16472977363175062,0.0,0.0
9
- Chronos-2,67.5925925925926,36.307128273958256,0.0,0.14791438772454144,0.0,0.0
10
- LightGBM,66.358024691358,36.739370201928836,0.20454036927361854,0.03409663050126502,0.0,0.0
11
- AutoETS,63.58024691358024,35.908870624227376,0.0,1.5253584038361796,0.0,0.0
12
- FlowState,62.34567901234568,35.21482359572895,0.0,0.8205954025996205,0.16666666666666666,0.0
13
- CatBoost,61.41975308641976,35.982559330359685,3.42108969184492,0.03905346701454776,0.0,0.0
14
- Toto-2.0-4m,56.48148148148149,35.180832137280916,0.0,0.1810118077664009,0.0,0.0
15
- Toto-1.0,56.172839506172835,32.41516602344565,0.0,5.0937543479594325,0.16666666666666666,0.0
16
- AutoARIMA,52.160493827160494,33.893658085803416,0.0,6.5345976113161015,0.0,0.0
17
- TabPFN-TS,48.76543209876543,34.19057001716027,0.0,52.326198869129215,0.0,0.0
18
- AutoTheta,48.456790123456784,32.52926186802178,0.0,0.9578271612919038,0.0,0.0
19
- Drift,46.29629629629629,29.639454067966152,0.0,0.4198026182352941,0.0,0.0
20
- TimesFM-2.5,45.98765432098766,32.83344751489832,0.0,0.3095206282094962,0.16666666666666666,0.0
21
- Chronos-Bolt,36.111111111111114,30.133730029400986,0.0,0.1587546411616528,0.0,0.0
22
- TabPFN-TS-3,36.11111111111111,28.575629786307356,0.0,190.9822121554963,0.0,0.0
23
- Moirai-2.0,35.49382716049383,28.236498726126015,0.0,0.21986280235955058,0.16666666666666666,0.0
24
- DeepAR,27.469135802469136,24.302560020818376,546.7685936688092,0.18274403532732447,0.0,0.0
25
- Sundial-Base,19.444444444444443,19.70951503418047,0.0,8.00438149490214,0.0,0.0
26
- PatchTST,14.506172839506174,15.279108700450617,310.3190003231231,0.1605401314516129,0.0,0.0
27
- Naive,13.271604938271608,15.593612422240255,0.0,0.46331807906862743,0.0,0.0
28
- TFT,11.111111111111112,9.838087249658834,445.02348117965687,0.18857640938013914,0.0,0.0
29
- Seasonal Naive,7.098765432098765,0.0,0.0,0.41450250024509805,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_econ/leaderboard_SQL.csv DELETED
@@ -1,29 +0,0 @@
1
- model_name,win_rate,skill_score,median_training_time_s_per100,median_inference_time_s_per100,training_corpus_overlap,num_failures
2
- TiRex-2,92.90123456790123,41.37587435805797,0.0,0.11294837920086495,0.0,0.0
3
- Chronos-2,78.08641975308643,37.73601252203713,0.0,0.14791438772454144,0.0,0.0
4
- Toto-2.0-2.5B,78.08641975308642,38.54527045088485,0.0,5.236902611304615,0.0,0.0
5
- TiRex,77.77777777777779,38.16787226217255,0.0,0.16472977363175062,0.0,0.0
6
- Toto-2.0-1B,77.77777777777779,38.30540837943911,0.0,2.4167769806179775,0.0,0.0
7
- Toto-2.0-22m,77.46913580246914,38.28322277552283,0.0,0.2300832338301921,0.0,0.0
8
- Toto-2.0-313m,77.46913580246914,38.27714813601945,0.0,0.9865880503225806,0.0,0.0
9
- Stat. Ensemble,70.67901234567903,37.119576639717835,0.0,73.43481351955408,0.0,0.0
10
- FlowState,66.35802469135803,35.273957411546085,0.0,0.8205954025996205,0.16666666666666666,0.0
11
- Toto-2.0-4m,62.96296296296296,35.90432755342822,0.0,0.1810118077664009,0.0,0.0
12
- Toto-1.0,59.56790123456791,33.496371356107844,0.0,5.0937543479594325,0.16666666666666666,0.0
13
- TabPFN-TS,59.5679012345679,35.173459448094114,0.0,52.326198869129215,0.0,0.0
14
- AutoETS,56.79012345679012,29.18586393990128,0.0,1.5253584038361796,0.0,0.0
15
- TimesFM-2.5,50.92592592592594,32.772070331944484,0.0,0.3095206282094962,0.16666666666666666,0.0
16
- AutoARIMA,48.76543209876543,31.72145242450589,0.0,6.5345976113161015,0.0,0.0
17
- Chronos-Bolt,47.22222222222223,31.81815534740079,0.0,0.1587546411616528,0.0,0.0
18
- Moirai-2.0,40.74074074074074,29.079628766325204,0.0,0.21986280235955058,0.16666666666666666,0.0
19
- AutoTheta,40.123456790123456,29.61896808086114,0.0,0.9578271612919038,0.0,0.0
20
- Drift,39.50617283950618,25.58270375016218,0.0,0.4198026182352941,0.0,0.0
21
- TabPFN-TS-3,39.19753086419753,29.19971717461506,0.0,190.9822121554963,0.0,0.0
22
- DeepAR,37.03703703703703,25.12762288287479,546.7685936688092,0.18274403532732447,0.0,0.0
23
- LightGBM,27.777777777777775,24.325044506495818,0.20454036927361854,0.03409663050126502,0.0,0.0
24
- CatBoost,22.839506172839506,23.419716355230047,3.42108969184492,0.03905346701454776,0.0,0.0
25
- PatchTST,19.753086419753085,16.930294384775955,310.3190003231231,0.1605401314516129,0.0,0.0
26
- Sundial-Base,15.74074074074074,14.510260955147846,0.0,8.00438149490214,0.0,0.0
27
- Naive,13.88888888888889,11.510640002523509,0.0,0.46331807906862743,0.0,0.0
28
- TFT,13.580246913580249,9.329379481293765,445.02348117965687,0.18857640938013914,0.0,0.0
29
- Seasonal Naive,7.4074074074074066,0.0,0.0,0.41450250024509805,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_econ/leaderboard_WAPE.csv DELETED
@@ -1,29 +0,0 @@
1
- model_name,win_rate,skill_score,median_training_time_s_per100,median_inference_time_s_per100,training_corpus_overlap,num_failures
2
- TiRex-2,87.96296296296296,42.13247790984753,0.0,0.11294837920086495,0.0,0.0
3
- Toto-2.0-1B,79.320987654321,38.80502192761649,0.0,2.4167769806179775,0.0,0.0
4
- Toto-2.0-2.5B,78.39506172839506,39.10703314170318,0.0,5.236902611304615,0.0,0.0
5
- Toto-2.0-313m,74.38271604938271,38.257695402459,0.0,0.9865880503225806,0.0,0.0
6
- Toto-2.0-22m,70.98765432098764,37.906655236674865,0.0,0.2300832338301921,0.0,0.0
7
- TiRex,68.82716049382715,37.758720587285445,0.0,0.16472977363175062,0.0,0.0
8
- Stat. Ensemble,64.50617283950618,38.177219528557146,0.0,73.43481351955408,0.0,0.0
9
- Chronos-2,63.271604938271594,36.558735189016225,0.0,0.14791438772454144,0.0,0.0
10
- Toto-1.0,58.95061728395062,33.97875884401389,0.0,5.0937543479594325,0.16666666666666666,0.0
11
- TimesFM-2.5,58.64197530864198,35.89256072267927,0.0,0.3095206282094962,0.16666666666666666,0.0
12
- TabPFN-TS,58.0246913580247,36.531743334435674,0.0,52.326198869129215,0.0,0.0
13
- FlowState,57.098765432098766,37.645403955852096,0.0,0.8205954025996205,0.16666666666666666,0.0
14
- CatBoost,55.24691358024691,35.20082715344605,3.42108969184492,0.03905346701454776,0.0,0.0
15
- Toto-2.0-4m,53.70370370370371,33.31225235226658,0.0,0.1810118077664009,0.0,0.0
16
- AutoETS,53.703703703703695,34.84116662551825,0.0,1.5253584038361796,0.0,0.0
17
- LightGBM,52.160493827160494,35.02206834104291,0.20454036927361854,0.03409663050126502,0.0,0.0
18
- AutoARIMA,48.76543209876543,35.732170334358024,0.0,6.5345976113161015,0.0,0.0
19
- Chronos-Bolt,45.37037037037037,30.478143266802604,0.0,0.1587546411616528,0.0,0.0
20
- TabPFN-TS-3,44.1358024691358,29.457560079978773,0.0,190.9822121554963,0.0,0.0
21
- Moirai-2.0,43.51851851851852,28.277512977220987,0.0,0.21986280235955058,0.16666666666666666,0.0
22
- Drift,41.66666666666666,28.435824921980835,0.0,0.4198026182352941,0.0,0.0
23
- AutoTheta,41.66666666666666,31.812923074763923,0.0,0.9578271612919038,0.0,0.0
24
- Naive,19.444444444444446,15.872310498117715,0.0,0.46331807906862743,0.0,0.0
25
- Sundial-Base,18.827160493827154,17.737235971841127,0.0,8.00438149490214,0.0,0.0
26
- PatchTST,17.59259259259259,15.619782622761335,310.3190003231231,0.1605401314516129,0.0,0.0
27
- DeepAR,17.59259259259259,19.60425306556468,546.7685936688092,0.18274403532732447,0.0,0.0
28
- TFT,15.432098765432098,6.946074243338563,445.02348117965687,0.18857640938013914,0.0,0.0
29
- Seasonal Naive,10.80246913580247,0.0,0.0,0.41450250024509805,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_econ/leaderboard_WQL.csv DELETED
@@ -1,29 +0,0 @@
1
- model_name,win_rate,skill_score,median_training_time_s_per100,median_inference_time_s_per100,training_corpus_overlap,num_failures
2
- TiRex-2,89.50617283950616,45.53906787899109,0.0,0.11294837920086495,0.0,0.0
3
- Toto-2.0-1B,81.17283950617283,42.35200647023204,0.0,2.4167769806179775,0.0,0.0
4
- Toto-2.0-2.5B,79.93827160493827,42.8032329067254,0.0,5.236902611304615,0.0,0.0
5
- Toto-2.0-313m,75.61728395061728,42.088190864136244,0.0,0.9865880503225806,0.0,0.0
6
- Toto-2.0-22m,75.0,42.320942130283335,0.0,0.2300832338301921,0.0,0.0
7
- TiRex,75.0,42.09146596586096,0.0,0.16472977363175062,0.0,0.0
8
- Chronos-2,70.06172839506173,40.960757337476025,0.0,0.14791438772454144,0.0,0.0
9
- FlowState,64.81481481481482,40.9054936267241,0.0,0.8205954025996205,0.16666666666666666,0.0
10
- TabPFN-TS,62.65432098765431,40.20371520247606,0.0,52.326198869129215,0.0,0.0
11
- Toto-1.0,62.34567901234568,38.100769058535434,0.0,5.0937543479594325,0.16666666666666666,0.0
12
- TimesFM-2.5,61.111111111111114,39.266493040907115,0.0,0.3095206282094962,0.16666666666666666,0.0
13
- Toto-2.0-4m,60.493827160493844,38.36462827294697,0.0,0.1810118077664009,0.0,0.0
14
- Stat. Ensemble,58.333333333333336,37.992090519620156,0.0,73.43481351955408,0.0,0.0
15
- Chronos-Bolt,52.77777777777777,35.534952430792764,0.0,0.1587546411616528,0.0,0.0
16
- AutoETS,52.160493827160494,36.76571988294681,0.0,1.5253584038361796,0.0,0.0
17
- TabPFN-TS-3,49.691358024691354,34.00880337940215,0.0,190.9822121554963,0.0,0.0
18
- Moirai-2.0,47.83950617283951,32.793225265991246,0.0,0.21986280235955058,0.16666666666666666,0.0
19
- AutoARIMA,46.60493827160494,34.44615311952015,0.0,6.5345976113161015,0.0,0.0
20
- AutoTheta,37.345679012345684,29.146207850323268,0.0,0.9578271612919038,0.0,0.0
21
- Drift,31.481481481481477,23.828649343246187,0.0,0.4198026182352941,0.0,0.0
22
- LightGBM,26.851851851851844,25.89068156049532,0.20454036927361854,0.03409663050126502,0.0,0.0
23
- CatBoost,26.851851851851844,26.0945614678313,3.42108969184492,0.03905346701454776,0.0,0.0
24
- DeepAR,26.234567901234566,21.869167576579297,546.7685936688092,0.18274403532732447,0.0,0.0
25
- PatchTST,22.8395061728395,19.911167839333967,310.3190003231231,0.1605401314516129,0.0,0.0
26
- Sundial-Base,18.827160493827154,17.532849869365606,0.0,8.00438149490214,0.0,0.0
27
- TFT,16.666666666666664,9.939963215759995,445.02348117965687,0.18857640938013914,0.0,0.0
28
- Naive,16.358024691358022,11.371958531244664,0.0,0.46331807906862743,0.0,0.0
29
- Seasonal Naive,11.419753086419755,0.0,0.0,0.41450250024509805,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_econ/pairwise_MASE.csv DELETED
@@ -1,290 +0,0 @@
1
- model_1,model_2,win_rate,win_rate_lower,win_rate_upper,skill_score,skill_score_lower,skill_score_upper
2
- TiRex-2,TiRex-2,0.5,0.5,0.5,0.0,0.0,0.0
3
- TiRex-2,Stat. Ensemble,0.583,0.25,0.833,0.034,-0.011,0.076
4
- TiRex-2,Toto-2.0-22m,0.75,0.5,0.917,0.043,0.018,0.069
5
- TiRex-2,Toto-2.0-1B,0.833,0.583,1.0,0.047,0.018,0.074
6
- TiRex-2,Toto-2.0-313m,0.833,0.583,1.0,0.047,0.02,0.07
7
- TiRex-2,Toto-2.0-2.5B,0.833,0.583,1.0,0.047,0.015,0.075
8
- TiRex-2,Chronos-2,0.833,0.583,1.0,0.067,0.014,0.124
9
- TiRex-2,TiRex,1.0,1.0,1.0,0.058,0.032,0.092
10
- TiRex-2,LightGBM,0.917,0.75,1.0,0.06,0.015,0.103
11
- TiRex-2,AutoETS,0.917,0.75,1.0,0.072,0.036,0.112
12
- TiRex-2,FlowState,0.833,0.583,1.0,0.082,0.013,0.144
13
- TiRex-2,CatBoost,0.833,0.583,1.0,0.071,0.024,0.117
14
- TiRex-2,Toto-1.0,0.833,0.583,1.0,0.12,0.051,0.194
15
- TiRex-2,Toto-2.0-4m,0.917,0.75,1.0,0.083,0.049,0.122
16
- TiRex-2,AutoARIMA,0.917,0.75,1.0,0.101,0.036,0.173
17
- TiRex-2,Chronos-Bolt,1.0,1.0,1.0,0.149,0.095,0.205
18
- TiRex-2,Seasonal Naive,1.0,1.0,1.0,0.406,0.298,0.505
19
- Stat. Ensemble,TiRex-2,0.417,0.167,0.75,-0.035,-0.083,0.011
20
- Stat. Ensemble,Stat. Ensemble,0.5,0.5,0.5,0.0,0.0,0.0
21
- Stat. Ensemble,Toto-2.0-22m,0.5,0.248,0.75,0.01,-0.034,0.052
22
- Stat. Ensemble,Toto-2.0-1B,0.5,0.25,0.75,0.013,-0.041,0.068
23
- Stat. Ensemble,Toto-2.0-313m,0.583,0.25,0.833,0.013,-0.039,0.064
24
- Stat. Ensemble,Toto-2.0-2.5B,0.667,0.417,0.917,0.013,-0.041,0.064
25
- Stat. Ensemble,Chronos-2,0.75,0.5,1.0,0.034,-0.014,0.087
26
- Stat. Ensemble,TiRex,0.75,0.5,1.0,0.025,-0.023,0.072
27
- Stat. Ensemble,LightGBM,0.75,0.5,1.0,0.027,-0.0,0.06
28
- Stat. Ensemble,AutoETS,0.75,0.5,1.0,0.04,0.016,0.067
29
- Stat. Ensemble,FlowState,0.667,0.417,0.917,0.05,-0.001,0.104
30
- Stat. Ensemble,CatBoost,0.75,0.5,1.0,0.039,0.005,0.073
31
- Stat. Ensemble,Toto-1.0,0.75,0.417,1.0,0.09,0.024,0.151
32
- Stat. Ensemble,Toto-2.0-4m,0.667,0.333,0.917,0.051,0.007,0.097
33
- Stat. Ensemble,AutoARIMA,0.833,0.583,1.0,0.069,0.021,0.135
34
- Stat. Ensemble,Chronos-Bolt,0.917,0.75,1.0,0.119,0.068,0.168
35
- Stat. Ensemble,Seasonal Naive,1.0,1.0,1.0,0.385,0.289,0.476
36
- Toto-2.0-22m,TiRex-2,0.25,0.083,0.5,-0.045,-0.074,-0.018
37
- Toto-2.0-22m,Stat. Ensemble,0.5,0.25,0.752,-0.01,-0.055,0.033
38
- Toto-2.0-22m,Toto-2.0-22m,0.5,0.5,0.5,0.0,0.0,0.0
39
- Toto-2.0-22m,Toto-2.0-1B,0.417,0.167,0.667,0.004,-0.028,0.04
40
- Toto-2.0-22m,Toto-2.0-313m,0.583,0.333,0.833,0.004,-0.023,0.031
41
- Toto-2.0-22m,Toto-2.0-2.5B,0.583,0.333,0.833,0.004,-0.029,0.034
42
- Toto-2.0-22m,Chronos-2,0.583,0.25,0.833,0.025,-0.041,0.081
43
- Toto-2.0-22m,TiRex,0.583,0.25,0.833,0.016,-0.02,0.048
44
- Toto-2.0-22m,LightGBM,0.667,0.417,0.917,0.018,-0.021,0.053
45
- Toto-2.0-22m,AutoETS,0.667,0.333,0.917,0.031,-0.008,0.068
46
- Toto-2.0-22m,FlowState,0.667,0.417,0.917,0.041,-0.025,0.105
47
- Toto-2.0-22m,CatBoost,0.667,0.417,0.917,0.03,-0.012,0.069
48
- Toto-2.0-22m,Toto-1.0,0.75,0.5,1.0,0.081,0.012,0.155
49
- Toto-2.0-22m,Toto-2.0-4m,1.0,1.0,1.0,0.042,0.025,0.061
50
- Toto-2.0-22m,AutoARIMA,0.667,0.417,0.917,0.06,-0.015,0.145
51
- Toto-2.0-22m,Chronos-Bolt,1.0,1.0,1.0,0.111,0.063,0.16
52
- Toto-2.0-22m,Seasonal Naive,1.0,1.0,1.0,0.379,0.266,0.482
53
- Toto-2.0-1B,TiRex-2,0.167,0.0,0.417,-0.049,-0.08,-0.018
54
- Toto-2.0-1B,Stat. Ensemble,0.5,0.25,0.75,-0.013,-0.073,0.039
55
- Toto-2.0-1B,Toto-2.0-22m,0.583,0.333,0.833,-0.004,-0.041,0.028
56
- Toto-2.0-1B,Toto-2.0-1B,0.5,0.5,0.5,0.0,0.0,0.0
57
- Toto-2.0-1B,Toto-2.0-313m,0.667,0.417,0.917,0.0,-0.011,0.011
58
- Toto-2.0-1B,Toto-2.0-2.5B,0.583,0.333,0.833,-0.0,-0.013,0.013
59
- Toto-2.0-1B,Chronos-2,0.5,0.25,0.752,0.021,-0.027,0.076
60
- Toto-2.0-1B,TiRex,0.667,0.417,0.917,0.012,-0.019,0.044
61
- Toto-2.0-1B,LightGBM,0.583,0.333,0.833,0.014,-0.046,0.063
62
- Toto-2.0-1B,AutoETS,0.667,0.417,0.917,0.027,-0.016,0.071
63
- Toto-2.0-1B,FlowState,0.667,0.417,0.917,0.038,-0.045,0.096
64
- Toto-2.0-1B,CatBoost,0.75,0.5,1.0,0.026,-0.035,0.074
65
- Toto-2.0-1B,Toto-1.0,0.583,0.25,0.833,0.077,0.011,0.152
66
- Toto-2.0-1B,Toto-2.0-4m,0.833,0.583,1.0,0.038,-0.006,0.081
67
- Toto-2.0-1B,AutoARIMA,0.833,0.583,1.0,0.057,-0.021,0.126
68
- Toto-2.0-1B,Chronos-Bolt,0.833,0.583,1.0,0.108,0.058,0.154
69
- Toto-2.0-1B,Seasonal Naive,0.917,0.75,1.0,0.376,0.262,0.473
70
- Toto-2.0-313m,TiRex-2,0.167,0.0,0.417,-0.049,-0.076,-0.021
71
- Toto-2.0-313m,Stat. Ensemble,0.417,0.167,0.75,-0.014,-0.068,0.037
72
- Toto-2.0-313m,Toto-2.0-22m,0.417,0.167,0.667,-0.004,-0.032,0.023
73
- Toto-2.0-313m,Toto-2.0-1B,0.333,0.083,0.583,-0.0,-0.011,0.011
74
- Toto-2.0-313m,Toto-2.0-313m,0.5,0.5,0.5,0.0,0.0,0.0
75
- Toto-2.0-313m,Toto-2.0-2.5B,0.5,0.25,0.75,-0.0,-0.009,0.01
76
- Toto-2.0-313m,Chronos-2,0.417,0.167,0.75,0.021,-0.03,0.075
77
- Toto-2.0-313m,TiRex,0.583,0.333,0.833,0.012,-0.013,0.041
78
- Toto-2.0-313m,LightGBM,0.667,0.417,0.917,0.014,-0.041,0.063
79
- Toto-2.0-313m,AutoETS,0.5,0.25,0.752,0.027,-0.011,0.069
80
- Toto-2.0-313m,FlowState,0.667,0.417,0.917,0.037,-0.043,0.1
81
- Toto-2.0-313m,CatBoost,0.667,0.417,0.917,0.026,-0.03,0.075
82
- Toto-2.0-313m,Toto-1.0,0.583,0.25,0.833,0.077,0.006,0.155
83
- Toto-2.0-313m,Toto-2.0-4m,0.667,0.417,0.917,0.038,0.001,0.08
84
- Toto-2.0-313m,AutoARIMA,0.75,0.5,1.0,0.057,-0.022,0.132
85
- Toto-2.0-313m,Chronos-Bolt,0.917,0.75,1.0,0.107,0.058,0.157
86
- Toto-2.0-313m,Seasonal Naive,1.0,1.0,1.0,0.376,0.262,0.475
87
- Toto-2.0-2.5B,TiRex-2,0.167,0.0,0.417,-0.049,-0.082,-0.015
88
- Toto-2.0-2.5B,Stat. Ensemble,0.333,0.083,0.583,-0.013,-0.068,0.039
89
- Toto-2.0-2.5B,Toto-2.0-22m,0.417,0.167,0.667,-0.004,-0.035,0.028
90
- Toto-2.0-2.5B,Toto-2.0-1B,0.417,0.167,0.667,0.0,-0.014,0.013
91
- Toto-2.0-2.5B,Toto-2.0-313m,0.5,0.25,0.75,0.0,-0.01,0.009
92
- Toto-2.0-2.5B,Toto-2.0-2.5B,0.5,0.5,0.5,0.0,0.0,0.0
93
- Toto-2.0-2.5B,Chronos-2,0.417,0.167,0.75,0.021,-0.024,0.072
94
- Toto-2.0-2.5B,TiRex,0.583,0.333,0.833,0.012,-0.011,0.037
95
- Toto-2.0-2.5B,LightGBM,0.667,0.417,0.917,0.014,-0.043,0.067
96
- Toto-2.0-2.5B,AutoETS,0.583,0.333,0.833,0.027,-0.011,0.068
97
- Toto-2.0-2.5B,FlowState,0.667,0.417,0.917,0.038,-0.043,0.103
98
- Toto-2.0-2.5B,CatBoost,0.667,0.417,0.917,0.026,-0.033,0.076
99
- Toto-2.0-2.5B,Toto-1.0,0.583,0.25,0.833,0.077,0.001,0.158
100
- Toto-2.0-2.5B,Toto-2.0-4m,0.667,0.417,0.917,0.038,-0.002,0.085
101
- Toto-2.0-2.5B,AutoARIMA,0.75,0.5,1.0,0.057,-0.023,0.135
102
- Toto-2.0-2.5B,Chronos-Bolt,0.917,0.75,1.0,0.108,0.058,0.156
103
- Toto-2.0-2.5B,Seasonal Naive,0.917,0.75,1.0,0.376,0.263,0.471
104
- Chronos-2,TiRex-2,0.167,0.0,0.417,-0.071,-0.141,-0.014
105
- Chronos-2,Stat. Ensemble,0.25,0.0,0.5,-0.035,-0.095,0.014
106
- Chronos-2,Toto-2.0-22m,0.417,0.167,0.75,-0.025,-0.088,0.039
107
- Chronos-2,Toto-2.0-1B,0.5,0.248,0.75,-0.022,-0.082,0.027
108
- Chronos-2,Toto-2.0-313m,0.583,0.25,0.833,-0.021,-0.081,0.029
109
- Chronos-2,Toto-2.0-2.5B,0.583,0.25,0.833,-0.022,-0.077,0.024
110
- Chronos-2,Chronos-2,0.5,0.5,0.5,0.0,0.0,0.0
111
- Chronos-2,TiRex,0.417,0.167,0.667,-0.009,-0.045,0.026
112
- Chronos-2,LightGBM,0.5,0.25,0.75,-0.007,-0.068,0.055
113
- Chronos-2,AutoETS,0.5,0.25,0.75,0.006,-0.027,0.041
114
- Chronos-2,FlowState,0.5,0.25,0.75,0.017,-0.064,0.092
115
- Chronos-2,CatBoost,0.583,0.333,0.833,0.005,-0.055,0.067
116
- Chronos-2,Toto-1.0,0.583,0.333,0.833,0.058,-0.037,0.145
117
- Chronos-2,Toto-2.0-4m,0.583,0.333,0.833,0.017,-0.054,0.091
118
- Chronos-2,AutoARIMA,0.667,0.417,0.917,0.037,-0.046,0.122
119
- Chronos-2,Chronos-Bolt,1.0,1.0,1.0,0.088,0.044,0.143
120
- Chronos-2,Seasonal Naive,1.0,1.0,1.0,0.363,0.264,0.451
121
- TiRex,TiRex-2,0.0,0.0,0.0,-0.062,-0.101,-0.033
122
- TiRex,Stat. Ensemble,0.25,0.0,0.5,-0.026,-0.078,0.023
123
- TiRex,Toto-2.0-22m,0.417,0.167,0.75,-0.016,-0.051,0.019
124
- TiRex,Toto-2.0-1B,0.333,0.083,0.583,-0.012,-0.046,0.018
125
- TiRex,Toto-2.0-313m,0.417,0.167,0.667,-0.012,-0.043,0.012
126
- TiRex,Toto-2.0-2.5B,0.417,0.167,0.667,-0.012,-0.038,0.011
127
- TiRex,Chronos-2,0.583,0.333,0.833,0.009,-0.026,0.043
128
- TiRex,TiRex,0.5,0.5,0.5,0.0,0.0,0.0
129
- TiRex,LightGBM,0.5,0.25,0.75,0.002,-0.051,0.049
130
- TiRex,AutoETS,0.5,0.25,0.75,0.015,-0.013,0.045
131
- TiRex,FlowState,0.583,0.333,0.833,0.026,-0.05,0.091
132
- TiRex,CatBoost,0.75,0.5,1.0,0.014,-0.041,0.062
133
- TiRex,Toto-1.0,0.583,0.333,0.833,0.066,-0.019,0.149
134
- TiRex,Toto-2.0-4m,0.583,0.333,0.833,0.026,-0.02,0.076
135
- TiRex,AutoARIMA,0.667,0.417,0.917,0.045,-0.033,0.133
136
- TiRex,Chronos-Bolt,0.917,0.75,1.0,0.097,0.05,0.149
137
- TiRex,Seasonal Naive,1.0,1.0,1.0,0.369,0.261,0.466
138
- LightGBM,TiRex-2,0.083,0.0,0.25,-0.064,-0.114,-0.016
139
- LightGBM,Stat. Ensemble,0.25,0.0,0.5,-0.028,-0.064,0.0
140
- LightGBM,Toto-2.0-22m,0.333,0.083,0.583,-0.018,-0.056,0.02
141
- LightGBM,Toto-2.0-1B,0.417,0.167,0.667,-0.015,-0.068,0.044
142
- LightGBM,Toto-2.0-313m,0.333,0.083,0.583,-0.014,-0.067,0.04
143
- LightGBM,Toto-2.0-2.5B,0.333,0.083,0.583,-0.015,-0.072,0.042
144
- LightGBM,Chronos-2,0.5,0.25,0.75,0.007,-0.059,0.064
145
- LightGBM,TiRex,0.5,0.25,0.75,-0.002,-0.051,0.049
146
- LightGBM,LightGBM,0.5,0.5,0.5,0.0,0.0,0.0
147
- LightGBM,AutoETS,0.667,0.417,0.917,0.013,-0.03,0.049
148
- LightGBM,FlowState,0.5,0.25,0.75,0.024,-0.019,0.072
149
- LightGBM,CatBoost,0.75,0.5,1.0,0.012,-0.002,0.026
150
- LightGBM,Toto-1.0,0.667,0.333,0.917,0.064,-0.009,0.132
151
- LightGBM,Toto-2.0-4m,0.5,0.25,0.75,0.024,-0.016,0.063
152
- LightGBM,AutoARIMA,0.5,0.25,0.75,0.043,-0.012,0.11
153
- LightGBM,Chronos-Bolt,0.917,0.75,1.0,0.095,0.053,0.136
154
- LightGBM,Seasonal Naive,1.0,1.0,1.0,0.367,0.267,0.458
155
- AutoETS,TiRex-2,0.083,0.0,0.25,-0.078,-0.126,-0.037
156
- AutoETS,Stat. Ensemble,0.25,0.0,0.5,-0.042,-0.072,-0.016
157
- AutoETS,Toto-2.0-22m,0.333,0.083,0.667,-0.032,-0.073,0.008
158
- AutoETS,Toto-2.0-1B,0.333,0.083,0.583,-0.028,-0.076,0.015
159
- AutoETS,Toto-2.0-313m,0.5,0.248,0.75,-0.028,-0.074,0.011
160
- AutoETS,Toto-2.0-2.5B,0.417,0.167,0.667,-0.028,-0.073,0.011
161
- AutoETS,Chronos-2,0.5,0.25,0.75,-0.006,-0.043,0.026
162
- AutoETS,TiRex,0.5,0.25,0.75,-0.015,-0.047,0.013
163
- AutoETS,LightGBM,0.333,0.083,0.583,-0.013,-0.052,0.029
164
- AutoETS,AutoETS,0.5,0.5,0.5,0.0,0.0,0.0
165
- AutoETS,FlowState,0.583,0.333,0.833,0.011,-0.051,0.077
166
- AutoETS,CatBoost,0.417,0.167,0.667,-0.001,-0.04,0.039
167
- AutoETS,Toto-1.0,0.583,0.333,0.833,0.052,-0.025,0.122
168
- AutoETS,Toto-2.0-4m,0.583,0.25,0.833,0.011,-0.035,0.059
169
- AutoETS,AutoARIMA,0.667,0.417,0.917,0.03,-0.036,0.112
170
- AutoETS,Chronos-Bolt,0.833,0.583,1.0,0.083,0.041,0.127
171
- AutoETS,Seasonal Naive,1.0,1.0,1.0,0.359,0.256,0.456
172
- FlowState,TiRex-2,0.167,0.0,0.417,-0.09,-0.168,-0.013
173
- FlowState,Stat. Ensemble,0.333,0.083,0.583,-0.053,-0.117,0.001
174
- FlowState,Toto-2.0-22m,0.333,0.083,0.583,-0.043,-0.117,0.025
175
- FlowState,Toto-2.0-1B,0.333,0.083,0.583,-0.039,-0.107,0.043
176
- FlowState,Toto-2.0-313m,0.333,0.083,0.583,-0.039,-0.112,0.041
177
- FlowState,Toto-2.0-2.5B,0.333,0.083,0.583,-0.039,-0.114,0.041
178
- FlowState,Chronos-2,0.5,0.25,0.75,-0.017,-0.102,0.06
179
- FlowState,TiRex,0.417,0.167,0.667,-0.026,-0.1,0.048
180
- FlowState,LightGBM,0.5,0.25,0.75,-0.024,-0.077,0.019
181
- FlowState,AutoETS,0.417,0.167,0.667,-0.011,-0.083,0.049
182
- FlowState,FlowState,0.5,0.5,0.5,0.0,0.0,0.0
183
- FlowState,CatBoost,0.667,0.417,0.917,-0.012,-0.06,0.028
184
- FlowState,Toto-1.0,0.583,0.292,0.833,0.041,-0.047,0.127
185
- FlowState,Toto-2.0-4m,0.5,0.25,0.75,0.001,-0.075,0.068
186
- FlowState,AutoARIMA,0.583,0.333,0.833,0.02,-0.017,0.055
187
- FlowState,Chronos-Bolt,0.833,0.625,1.0,0.073,0.02,0.125
188
- FlowState,Seasonal Naive,1.0,1.0,1.0,0.352,0.265,0.429
189
- CatBoost,TiRex-2,0.167,0.0,0.417,-0.077,-0.133,-0.024
190
- CatBoost,Stat. Ensemble,0.25,0.0,0.5,-0.041,-0.078,-0.005
191
- CatBoost,Toto-2.0-22m,0.333,0.083,0.583,-0.031,-0.074,0.012
192
- CatBoost,Toto-2.0-1B,0.25,0.0,0.5,-0.027,-0.08,0.034
193
- CatBoost,Toto-2.0-313m,0.333,0.083,0.583,-0.027,-0.081,0.029
194
- CatBoost,Toto-2.0-2.5B,0.333,0.083,0.583,-0.027,-0.083,0.032
195
- CatBoost,Chronos-2,0.417,0.167,0.667,-0.005,-0.071,0.052
196
- CatBoost,TiRex,0.25,0.0,0.5,-0.014,-0.066,0.039
197
- CatBoost,LightGBM,0.25,0.0,0.5,-0.012,-0.026,0.002
198
- CatBoost,AutoETS,0.583,0.333,0.833,0.001,-0.041,0.039
199
- CatBoost,FlowState,0.333,0.083,0.583,0.012,-0.029,0.057
200
- CatBoost,CatBoost,0.5,0.5,0.5,0.0,0.0,0.0
201
- CatBoost,Toto-1.0,0.667,0.333,0.917,0.053,-0.022,0.121
202
- CatBoost,Toto-2.0-4m,0.5,0.25,0.75,0.012,-0.033,0.054
203
- CatBoost,AutoARIMA,0.583,0.25,0.833,0.032,-0.023,0.093
204
- CatBoost,Chronos-Bolt,0.917,0.75,1.0,0.084,0.046,0.12
205
- CatBoost,Seasonal Naive,1.0,1.0,1.0,0.36,0.26,0.448
206
- Toto-1.0,TiRex-2,0.167,0.0,0.417,-0.137,-0.24,-0.054
207
- Toto-1.0,Stat. Ensemble,0.25,0.0,0.583,-0.099,-0.177,-0.024
208
- Toto-1.0,Toto-2.0-22m,0.25,0.0,0.5,-0.088,-0.183,-0.012
209
- Toto-1.0,Toto-2.0-1B,0.417,0.167,0.75,-0.084,-0.179,-0.012
210
- Toto-1.0,Toto-2.0-313m,0.417,0.167,0.75,-0.084,-0.184,-0.006
211
- Toto-1.0,Toto-2.0-2.5B,0.417,0.167,0.75,-0.084,-0.188,-0.001
212
- Toto-1.0,Chronos-2,0.417,0.167,0.667,-0.061,-0.169,0.035
213
- Toto-1.0,TiRex,0.417,0.167,0.667,-0.071,-0.175,0.019
214
- Toto-1.0,LightGBM,0.333,0.083,0.667,-0.068,-0.152,0.009
215
- Toto-1.0,AutoETS,0.417,0.167,0.667,-0.055,-0.139,0.025
216
- Toto-1.0,FlowState,0.417,0.167,0.708,-0.043,-0.146,0.045
217
- Toto-1.0,CatBoost,0.333,0.083,0.667,-0.056,-0.138,0.021
218
- Toto-1.0,Toto-1.0,0.5,0.5,0.5,0.0,0.0,0.0
219
- Toto-1.0,Toto-2.0-4m,0.583,0.333,0.833,-0.043,-0.126,0.025
220
- Toto-1.0,AutoARIMA,0.583,0.333,0.833,-0.022,-0.108,0.05
221
- Toto-1.0,Chronos-Bolt,0.75,0.5,0.958,0.033,-0.034,0.097
222
- Toto-1.0,Seasonal Naive,0.917,0.75,1.0,0.324,0.198,0.433
223
- Toto-2.0-4m,TiRex-2,0.083,0.0,0.25,-0.09,-0.139,-0.051
224
- Toto-2.0-4m,Stat. Ensemble,0.333,0.083,0.667,-0.054,-0.108,-0.007
225
- Toto-2.0-4m,Toto-2.0-22m,0.0,0.0,0.0,-0.044,-0.065,-0.026
226
- Toto-2.0-4m,Toto-2.0-1B,0.167,0.0,0.417,-0.04,-0.088,0.006
227
- Toto-2.0-4m,Toto-2.0-313m,0.333,0.083,0.583,-0.039,-0.087,-0.001
228
- Toto-2.0-4m,Toto-2.0-2.5B,0.333,0.083,0.583,-0.04,-0.093,0.002
229
- Toto-2.0-4m,Chronos-2,0.417,0.167,0.667,-0.018,-0.1,0.051
230
- Toto-2.0-4m,TiRex,0.417,0.167,0.667,-0.027,-0.082,0.019
231
- Toto-2.0-4m,LightGBM,0.5,0.25,0.75,-0.025,-0.068,0.016
232
- Toto-2.0-4m,AutoETS,0.417,0.167,0.75,-0.011,-0.063,0.034
233
- Toto-2.0-4m,FlowState,0.5,0.25,0.75,-0.001,-0.073,0.07
234
- Toto-2.0-4m,CatBoost,0.5,0.25,0.75,-0.013,-0.057,0.032
235
- Toto-2.0-4m,Toto-1.0,0.417,0.167,0.667,0.041,-0.025,0.112
236
- Toto-2.0-4m,Toto-2.0-4m,0.5,0.5,0.5,0.0,0.0,0.0
237
- Toto-2.0-4m,AutoARIMA,0.5,0.25,0.75,0.019,-0.063,0.108
238
- Toto-2.0-4m,Chronos-Bolt,0.667,0.417,0.917,0.072,0.02,0.128
239
- Toto-2.0-4m,Seasonal Naive,0.917,0.75,1.0,0.352,0.226,0.462
240
- AutoARIMA,TiRex-2,0.083,0.0,0.25,-0.112,-0.209,-0.037
241
- AutoARIMA,Stat. Ensemble,0.167,0.0,0.417,-0.074,-0.156,-0.022
242
- AutoARIMA,Toto-2.0-22m,0.333,0.083,0.583,-0.064,-0.169,0.015
243
- AutoARIMA,Toto-2.0-1B,0.167,0.0,0.417,-0.06,-0.145,0.02
244
- AutoARIMA,Toto-2.0-313m,0.25,0.0,0.5,-0.06,-0.152,0.021
245
- AutoARIMA,Toto-2.0-2.5B,0.25,0.0,0.5,-0.06,-0.156,0.022
246
- AutoARIMA,Chronos-2,0.333,0.083,0.583,-0.038,-0.139,0.044
247
- AutoARIMA,TiRex,0.333,0.083,0.583,-0.047,-0.154,0.032
248
- AutoARIMA,LightGBM,0.5,0.25,0.75,-0.045,-0.124,0.012
249
- AutoARIMA,AutoETS,0.333,0.083,0.583,-0.031,-0.126,0.035
250
- AutoARIMA,FlowState,0.417,0.167,0.667,-0.02,-0.058,0.017
251
- AutoARIMA,CatBoost,0.417,0.167,0.75,-0.033,-0.102,0.023
252
- AutoARIMA,Toto-1.0,0.417,0.167,0.667,0.022,-0.052,0.097
253
- AutoARIMA,Toto-2.0-4m,0.5,0.25,0.75,-0.02,-0.121,0.059
254
- AutoARIMA,AutoARIMA,0.5,0.5,0.5,0.0,0.0,0.0
255
- AutoARIMA,Chronos-Bolt,0.667,0.417,0.917,0.054,-0.009,0.113
256
- AutoARIMA,Seasonal Naive,1.0,1.0,1.0,0.339,0.256,0.422
257
- Chronos-Bolt,TiRex-2,0.0,0.0,0.0,-0.175,-0.258,-0.106
258
- Chronos-Bolt,Stat. Ensemble,0.083,0.0,0.25,-0.136,-0.202,-0.073
259
- Chronos-Bolt,Toto-2.0-22m,0.0,0.0,0.0,-0.125,-0.191,-0.068
260
- Chronos-Bolt,Toto-2.0-1B,0.167,0.0,0.417,-0.121,-0.182,-0.062
261
- Chronos-Bolt,Toto-2.0-313m,0.083,0.0,0.25,-0.12,-0.186,-0.062
262
- Chronos-Bolt,Toto-2.0-2.5B,0.083,0.0,0.25,-0.121,-0.185,-0.061
263
- Chronos-Bolt,Chronos-2,0.0,0.0,0.0,-0.097,-0.167,-0.046
264
- Chronos-Bolt,TiRex,0.083,0.0,0.25,-0.107,-0.175,-0.053
265
- Chronos-Bolt,LightGBM,0.083,0.0,0.25,-0.104,-0.157,-0.056
266
- Chronos-Bolt,AutoETS,0.167,0.0,0.417,-0.09,-0.145,-0.043
267
- Chronos-Bolt,FlowState,0.167,0.0,0.375,-0.078,-0.143,-0.02
268
- Chronos-Bolt,CatBoost,0.083,0.0,0.25,-0.091,-0.136,-0.049
269
- Chronos-Bolt,Toto-1.0,0.25,0.042,0.5,-0.034,-0.107,0.033
270
- Chronos-Bolt,Toto-2.0-4m,0.333,0.083,0.583,-0.078,-0.146,-0.021
271
- Chronos-Bolt,AutoARIMA,0.333,0.083,0.583,-0.057,-0.128,0.009
272
- Chronos-Bolt,Chronos-Bolt,0.5,0.5,0.5,0.0,0.0,0.0
273
- Chronos-Bolt,Seasonal Naive,0.833,0.583,1.0,0.301,0.198,0.389
274
- Seasonal Naive,TiRex-2,0.0,0.0,0.0,-0.682,-1.021,-0.425
275
- Seasonal Naive,Stat. Ensemble,0.0,0.0,0.0,-0.625,-0.907,-0.407
276
- Seasonal Naive,Toto-2.0-22m,0.0,0.0,0.0,-0.61,-0.932,-0.362
277
- Seasonal Naive,Toto-2.0-1B,0.083,0.0,0.25,-0.604,-0.897,-0.355
278
- Seasonal Naive,Toto-2.0-313m,0.0,0.0,0.0,-0.604,-0.904,-0.354
279
- Seasonal Naive,Toto-2.0-2.5B,0.083,0.0,0.25,-0.604,-0.891,-0.357
280
- Seasonal Naive,Chronos-2,0.0,0.0,0.0,-0.57,-0.821,-0.358
281
- Seasonal Naive,TiRex,0.0,0.0,0.0,-0.584,-0.872,-0.353
282
- Seasonal Naive,LightGBM,0.0,0.0,0.0,-0.581,-0.845,-0.364
283
- Seasonal Naive,AutoETS,0.0,0.0,0.0,-0.56,-0.837,-0.345
284
- Seasonal Naive,FlowState,0.0,0.0,0.0,-0.544,-0.752,-0.36
285
- Seasonal Naive,CatBoost,0.0,0.0,0.0,-0.562,-0.812,-0.352
286
- Seasonal Naive,Toto-1.0,0.083,0.0,0.25,-0.48,-0.763,-0.247
287
- Seasonal Naive,Toto-2.0-4m,0.083,0.0,0.25,-0.543,-0.858,-0.292
288
- Seasonal Naive,AutoARIMA,0.0,0.0,0.0,-0.513,-0.73,-0.344
289
- Seasonal Naive,Chronos-Bolt,0.167,0.0,0.417,-0.431,-0.638,-0.246
290
- Seasonal Naive,Seasonal Naive,0.5,0.5,0.5,0.0,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_econ/pairwise_SQL.csv DELETED
@@ -1,290 +0,0 @@
1
- model_1,model_2,win_rate,win_rate_lower,win_rate_upper,skill_score,skill_score_lower,skill_score_upper
2
- TiRex-2,TiRex-2,0.5,0.5,0.5,0.0,0.0,0.0
3
- TiRex-2,Toto-2.0-1B,0.833,0.583,1.0,0.05,0.019,0.077
4
- TiRex-2,TiRex,1.0,1.0,1.0,0.052,0.026,0.086
5
- TiRex-2,Toto-2.0-2.5B,0.833,0.583,1.0,0.046,0.014,0.077
6
- TiRex-2,Chronos-2,0.917,0.75,1.0,0.058,0.014,0.109
7
- TiRex-2,Toto-2.0-22m,0.75,0.5,0.917,0.05,0.023,0.079
8
- TiRex-2,Toto-2.0-313m,0.833,0.583,1.0,0.05,0.022,0.076
9
- TiRex-2,Stat. Ensemble,0.833,0.583,1.0,0.068,0.024,0.107
10
- TiRex-2,FlowState,0.833,0.583,1.0,0.094,0.027,0.152
11
- TiRex-2,Toto-2.0-4m,0.917,0.75,1.0,0.085,0.049,0.126
12
- TiRex-2,Toto-1.0,1.0,1.0,1.0,0.118,0.061,0.181
13
- TiRex-2,TabPFN-TS,0.833,0.583,1.0,0.096,0.05,0.138
14
- TiRex-2,AutoETS,1.0,1.0,1.0,0.172,0.075,0.301
15
- TiRex-2,AutoARIMA,0.917,0.75,1.0,0.141,0.074,0.215
16
- TiRex-2,TimesFM-2.5,0.917,0.75,1.0,0.128,0.08,0.174
17
- TiRex-2,Chronos-Bolt,1.0,1.0,1.0,0.14,0.09,0.195
18
- TiRex-2,Seasonal Naive,1.0,1.0,1.0,0.414,0.318,0.502
19
- Toto-2.0-1B,TiRex-2,0.167,0.0,0.417,-0.052,-0.083,-0.019
20
- Toto-2.0-1B,Toto-2.0-1B,0.5,0.5,0.5,0.0,0.0,0.0
21
- Toto-2.0-1B,TiRex,0.5,0.25,0.75,0.002,-0.025,0.032
22
- Toto-2.0-1B,Toto-2.0-2.5B,0.417,0.167,0.667,-0.004,-0.018,0.01
23
- Toto-2.0-1B,Chronos-2,0.417,0.167,0.75,0.009,-0.036,0.055
24
- Toto-2.0-1B,Toto-2.0-22m,0.5,0.167,0.75,0.0,-0.03,0.027
25
- Toto-2.0-1B,Toto-2.0-313m,0.583,0.333,0.833,0.0,-0.016,0.014
26
- Toto-2.0-1B,Stat. Ensemble,0.75,0.5,1.0,0.019,-0.04,0.068
27
- Toto-2.0-1B,FlowState,0.75,0.5,1.0,0.047,-0.032,0.1
28
- Toto-2.0-1B,Toto-2.0-4m,0.833,0.583,1.0,0.037,-0.006,0.08
29
- Toto-2.0-1B,Toto-1.0,0.75,0.5,1.0,0.072,0.013,0.134
30
- Toto-2.0-1B,TabPFN-TS,0.833,0.583,1.0,0.048,-0.007,0.097
31
- Toto-2.0-1B,AutoETS,0.75,0.5,1.0,0.129,0.018,0.268
32
- Toto-2.0-1B,AutoARIMA,0.833,0.583,1.0,0.096,0.016,0.174
33
- Toto-2.0-1B,TimesFM-2.5,0.917,0.75,1.0,0.082,0.045,0.115
34
- Toto-2.0-1B,Chronos-Bolt,0.833,0.583,1.0,0.095,0.048,0.139
35
- Toto-2.0-1B,Seasonal Naive,0.917,0.75,1.0,0.383,0.278,0.469
36
- TiRex,TiRex-2,0.0,0.0,0.0,-0.055,-0.094,-0.027
37
- TiRex,Toto-2.0-1B,0.5,0.25,0.75,-0.002,-0.033,0.024
38
- TiRex,TiRex,0.5,0.5,0.5,0.0,0.0,0.0
39
- TiRex,Toto-2.0-2.5B,0.5,0.25,0.75,-0.006,-0.031,0.017
40
- TiRex,Chronos-2,0.667,0.417,0.917,0.007,-0.028,0.036
41
- TiRex,Toto-2.0-22m,0.5,0.25,0.833,-0.002,-0.037,0.033
42
- TiRex,Toto-2.0-313m,0.417,0.167,0.667,-0.002,-0.03,0.024
43
- TiRex,Stat. Ensemble,0.75,0.5,1.0,0.017,-0.034,0.06
44
- TiRex,FlowState,0.833,0.583,1.0,0.045,-0.023,0.098
45
- TiRex,Toto-2.0-4m,0.667,0.415,0.917,0.035,-0.011,0.083
46
- TiRex,Toto-1.0,0.667,0.333,0.917,0.07,-0.008,0.143
47
- TiRex,TabPFN-TS,0.833,0.583,1.0,0.046,0.002,0.086
48
- TiRex,AutoETS,0.75,0.5,1.0,0.127,0.025,0.268
49
- TiRex,AutoARIMA,0.833,0.583,1.0,0.094,0.019,0.181
50
- TiRex,TimesFM-2.5,0.917,0.75,1.0,0.08,0.038,0.122
51
- TiRex,Chronos-Bolt,0.917,0.75,1.0,0.093,0.05,0.141
52
- TiRex,Seasonal Naive,1.0,1.0,1.0,0.382,0.282,0.467
53
- Toto-2.0-2.5B,TiRex-2,0.167,0.0,0.417,-0.048,-0.084,-0.015
54
- Toto-2.0-2.5B,Toto-2.0-1B,0.583,0.333,0.833,0.004,-0.011,0.018
55
- Toto-2.0-2.5B,TiRex,0.5,0.25,0.75,0.006,-0.017,0.03
56
- Toto-2.0-2.5B,Toto-2.0-2.5B,0.5,0.5,0.5,0.0,0.0,0.0
57
- Toto-2.0-2.5B,Chronos-2,0.417,0.167,0.75,0.013,-0.029,0.057
58
- Toto-2.0-2.5B,Toto-2.0-22m,0.583,0.25,0.833,0.004,-0.024,0.036
59
- Toto-2.0-2.5B,Toto-2.0-313m,0.583,0.331,0.833,0.004,-0.006,0.014
60
- Toto-2.0-2.5B,Stat. Ensemble,0.583,0.333,0.833,0.023,-0.033,0.071
61
- Toto-2.0-2.5B,FlowState,0.667,0.417,0.917,0.051,-0.024,0.108
62
- Toto-2.0-2.5B,Toto-2.0-4m,0.667,0.417,0.917,0.041,0.0,0.089
63
- Toto-2.0-2.5B,Toto-1.0,0.75,0.5,1.0,0.076,0.006,0.146
64
- Toto-2.0-2.5B,TabPFN-TS,0.75,0.5,1.0,0.052,0.005,0.095
65
- Toto-2.0-2.5B,AutoETS,0.833,0.583,1.0,0.132,0.027,0.27
66
- Toto-2.0-2.5B,AutoARIMA,0.833,0.583,1.0,0.1,0.018,0.186
67
- Toto-2.0-2.5B,TimesFM-2.5,0.917,0.75,1.0,0.086,0.05,0.122
68
- Toto-2.0-2.5B,Chronos-Bolt,0.917,0.75,1.0,0.099,0.05,0.146
69
- Toto-2.0-2.5B,Seasonal Naive,1.0,1.0,1.0,0.385,0.285,0.47
70
- Chronos-2,TiRex-2,0.083,0.0,0.25,-0.062,-0.123,-0.014
71
- Chronos-2,Toto-2.0-1B,0.583,0.25,0.833,-0.009,-0.059,0.035
72
- Chronos-2,TiRex,0.333,0.083,0.583,-0.007,-0.037,0.027
73
- Chronos-2,Toto-2.0-2.5B,0.583,0.25,0.833,-0.013,-0.06,0.028
74
- Chronos-2,Chronos-2,0.5,0.5,0.5,0.0,0.0,0.0
75
- Chronos-2,Toto-2.0-22m,0.5,0.167,0.833,-0.009,-0.065,0.049
76
- Chronos-2,Toto-2.0-313m,0.5,0.167,0.833,-0.009,-0.06,0.036
77
- Chronos-2,Stat. Ensemble,0.833,0.583,1.0,0.01,-0.042,0.051
78
- Chronos-2,FlowState,0.667,0.417,0.917,0.038,-0.034,0.106
79
- Chronos-2,Toto-2.0-4m,0.667,0.415,0.917,0.029,-0.035,0.098
80
- Chronos-2,Toto-1.0,0.667,0.333,0.917,0.064,-0.021,0.141
81
- Chronos-2,TabPFN-TS,0.75,0.5,1.0,0.04,0.005,0.072
82
- Chronos-2,AutoETS,0.75,0.5,1.0,0.121,0.02,0.261
83
- Chronos-2,AutoARIMA,0.75,0.5,1.0,0.088,0.009,0.174
84
- Chronos-2,TimesFM-2.5,0.917,0.75,1.0,0.074,0.039,0.111
85
- Chronos-2,Chronos-Bolt,1.0,1.0,1.0,0.087,0.043,0.142
86
- Chronos-2,Seasonal Naive,1.0,1.0,1.0,0.377,0.286,0.457
87
- Toto-2.0-22m,TiRex-2,0.25,0.083,0.5,-0.053,-0.086,-0.024
88
- Toto-2.0-22m,Toto-2.0-1B,0.5,0.25,0.833,-0.0,-0.028,0.029
89
- Toto-2.0-22m,TiRex,0.5,0.167,0.75,0.002,-0.034,0.036
90
- Toto-2.0-22m,Toto-2.0-2.5B,0.417,0.167,0.75,-0.004,-0.038,0.023
91
- Toto-2.0-22m,Chronos-2,0.5,0.167,0.833,0.009,-0.051,0.061
92
- Toto-2.0-22m,Toto-2.0-22m,0.5,0.5,0.5,0.0,0.0,0.0
93
- Toto-2.0-22m,Toto-2.0-313m,0.417,0.167,0.75,0.0,-0.025,0.023
94
- Toto-2.0-22m,Stat. Ensemble,0.667,0.417,0.917,0.019,-0.03,0.062
95
- Toto-2.0-22m,FlowState,0.583,0.333,0.833,0.046,-0.012,0.098
96
- Toto-2.0-22m,Toto-2.0-4m,0.833,0.583,1.0,0.037,0.019,0.057
97
- Toto-2.0-22m,Toto-1.0,0.667,0.417,0.917,0.072,0.016,0.131
98
- Toto-2.0-22m,TabPFN-TS,0.667,0.417,0.917,0.048,-0.011,0.096
99
- Toto-2.0-22m,AutoETS,0.833,0.583,1.0,0.128,0.025,0.268
100
- Toto-2.0-22m,AutoARIMA,0.75,0.5,1.0,0.096,0.021,0.181
101
- Toto-2.0-22m,TimesFM-2.5,0.917,0.75,1.0,0.082,0.025,0.13
102
- Toto-2.0-22m,Chronos-Bolt,1.0,1.0,1.0,0.095,0.055,0.138
103
- Toto-2.0-22m,Seasonal Naive,1.0,1.0,1.0,0.383,0.284,0.473
104
- Toto-2.0-313m,TiRex-2,0.167,0.0,0.417,-0.053,-0.082,-0.023
105
- Toto-2.0-313m,Toto-2.0-1B,0.417,0.167,0.667,-0.0,-0.015,0.015
106
- Toto-2.0-313m,TiRex,0.583,0.333,0.833,0.002,-0.025,0.029
107
- Toto-2.0-313m,Toto-2.0-2.5B,0.417,0.167,0.669,-0.004,-0.014,0.006
108
- Toto-2.0-313m,Chronos-2,0.5,0.167,0.833,0.009,-0.038,0.056
109
- Toto-2.0-313m,Toto-2.0-22m,0.583,0.25,0.833,-0.0,-0.024,0.024
110
- Toto-2.0-313m,Toto-2.0-313m,0.5,0.5,0.5,0.0,0.0,0.0
111
- Toto-2.0-313m,Stat. Ensemble,0.667,0.417,0.917,0.018,-0.031,0.064
112
- Toto-2.0-313m,FlowState,0.667,0.417,0.917,0.046,-0.02,0.099
113
- Toto-2.0-313m,Toto-2.0-4m,0.667,0.417,0.917,0.037,0.001,0.079
114
- Toto-2.0-313m,Toto-1.0,0.667,0.417,0.917,0.072,0.005,0.139
115
- Toto-2.0-313m,TabPFN-TS,0.75,0.5,1.0,0.048,0.0,0.09
116
- Toto-2.0-313m,AutoETS,0.75,0.5,1.0,0.128,0.025,0.267
117
- Toto-2.0-313m,AutoARIMA,0.833,0.583,1.0,0.096,0.02,0.177
118
- Toto-2.0-313m,TimesFM-2.5,0.917,0.75,1.0,0.082,0.041,0.12
119
- Toto-2.0-313m,Chronos-Bolt,0.917,0.75,1.0,0.095,0.047,0.142
120
- Toto-2.0-313m,Seasonal Naive,1.0,1.0,1.0,0.383,0.283,0.468
121
- Stat. Ensemble,TiRex-2,0.167,0.0,0.417,-0.073,-0.119,-0.024
122
- Stat. Ensemble,Toto-2.0-1B,0.25,0.0,0.5,-0.019,-0.072,0.039
123
- Stat. Ensemble,TiRex,0.25,0.0,0.5,-0.017,-0.064,0.033
124
- Stat. Ensemble,Toto-2.0-2.5B,0.417,0.167,0.667,-0.023,-0.076,0.032
125
- Stat. Ensemble,Chronos-2,0.167,0.0,0.417,-0.01,-0.053,0.04
126
- Stat. Ensemble,Toto-2.0-22m,0.333,0.083,0.583,-0.019,-0.066,0.029
127
- Stat. Ensemble,Toto-2.0-313m,0.333,0.083,0.583,-0.019,-0.069,0.03
128
- Stat. Ensemble,Stat. Ensemble,0.5,0.5,0.5,0.0,0.0,0.0
129
- Stat. Ensemble,FlowState,0.5,0.167,0.75,0.029,-0.016,0.073
130
- Stat. Ensemble,Toto-2.0-4m,0.417,0.167,0.667,0.019,-0.029,0.073
131
- Stat. Ensemble,Toto-1.0,0.667,0.333,0.917,0.054,-0.012,0.118
132
- Stat. Ensemble,TabPFN-TS,0.75,0.5,1.0,0.03,-0.01,0.063
133
- Stat. Ensemble,AutoETS,0.667,0.417,0.917,0.112,0.011,0.257
134
- Stat. Ensemble,AutoARIMA,0.833,0.583,1.0,0.079,0.03,0.146
135
- Stat. Ensemble,TimesFM-2.5,0.833,0.583,1.0,0.065,0.013,0.121
136
- Stat. Ensemble,Chronos-Bolt,0.917,0.75,1.0,0.078,0.024,0.131
137
- Stat. Ensemble,Seasonal Naive,1.0,1.0,1.0,0.371,0.288,0.452
138
- FlowState,TiRex-2,0.167,0.0,0.417,-0.104,-0.179,-0.028
139
- FlowState,Toto-2.0-1B,0.25,0.0,0.5,-0.049,-0.112,0.031
140
- FlowState,TiRex,0.167,0.0,0.417,-0.047,-0.109,0.023
141
- FlowState,Toto-2.0-2.5B,0.333,0.083,0.583,-0.053,-0.121,0.024
142
- FlowState,Chronos-2,0.333,0.083,0.583,-0.04,-0.118,0.033
143
- FlowState,Toto-2.0-22m,0.417,0.167,0.667,-0.049,-0.109,0.012
144
- FlowState,Toto-2.0-313m,0.333,0.083,0.583,-0.049,-0.109,0.02
145
- FlowState,Stat. Ensemble,0.5,0.25,0.833,-0.029,-0.079,0.016
146
- FlowState,FlowState,0.5,0.5,0.5,0.0,0.0,0.0
147
- FlowState,Toto-2.0-4m,0.5,0.25,0.75,-0.01,-0.079,0.052
148
- FlowState,Toto-1.0,0.583,0.292,0.833,0.027,-0.057,0.11
149
- FlowState,TabPFN-TS,0.583,0.333,0.833,0.002,-0.065,0.055
150
- FlowState,AutoETS,0.583,0.333,0.833,0.086,-0.042,0.243
151
- FlowState,AutoARIMA,0.75,0.5,1.0,0.052,0.005,0.102
152
- FlowState,TimesFM-2.5,0.667,0.417,0.875,0.037,-0.024,0.11
153
- FlowState,Chronos-Bolt,0.833,0.625,1.0,0.051,-0.002,0.101
154
- FlowState,Seasonal Naive,1.0,1.0,1.0,0.353,0.274,0.424
155
- Toto-2.0-4m,TiRex-2,0.083,0.0,0.25,-0.093,-0.144,-0.052
156
- Toto-2.0-4m,Toto-2.0-1B,0.167,0.0,0.417,-0.039,-0.087,0.006
157
- Toto-2.0-4m,TiRex,0.333,0.083,0.585,-0.037,-0.091,0.011
158
- Toto-2.0-4m,Toto-2.0-2.5B,0.333,0.083,0.583,-0.043,-0.097,-0.0
159
- Toto-2.0-4m,Chronos-2,0.333,0.083,0.585,-0.029,-0.108,0.034
160
- Toto-2.0-4m,Toto-2.0-22m,0.167,0.0,0.417,-0.039,-0.06,-0.019
161
- Toto-2.0-4m,Toto-2.0-313m,0.333,0.083,0.583,-0.038,-0.086,-0.001
162
- Toto-2.0-4m,Stat. Ensemble,0.583,0.333,0.833,-0.019,-0.079,0.028
163
- Toto-2.0-4m,FlowState,0.5,0.25,0.75,0.01,-0.055,0.073
164
- Toto-2.0-4m,Toto-2.0-4m,0.5,0.5,0.5,0.0,0.0,0.0
165
- Toto-2.0-4m,Toto-1.0,0.417,0.167,0.667,0.036,-0.022,0.097
166
- Toto-2.0-4m,TabPFN-TS,0.583,0.333,0.833,0.011,-0.067,0.07
167
- Toto-2.0-4m,AutoETS,0.75,0.5,1.0,0.095,-0.02,0.241
168
- Toto-2.0-4m,AutoARIMA,0.583,0.333,0.833,0.061,-0.023,0.155
169
- Toto-2.0-4m,TimesFM-2.5,0.667,0.417,0.917,0.047,-0.027,0.112
170
- Toto-2.0-4m,Chronos-Bolt,0.667,0.417,0.917,0.06,0.01,0.112
171
- Toto-2.0-4m,Seasonal Naive,0.917,0.75,1.0,0.359,0.246,0.458
172
- Toto-1.0,TiRex-2,0.0,0.0,0.0,-0.134,-0.221,-0.065
173
- Toto-1.0,Toto-2.0-1B,0.25,0.0,0.5,-0.078,-0.155,-0.013
174
- Toto-1.0,TiRex,0.333,0.083,0.667,-0.076,-0.167,0.008
175
- Toto-1.0,Toto-2.0-2.5B,0.25,0.0,0.5,-0.082,-0.171,-0.006
176
- Toto-1.0,Chronos-2,0.333,0.083,0.667,-0.068,-0.164,0.021
177
- Toto-1.0,Toto-2.0-22m,0.333,0.083,0.583,-0.078,-0.151,-0.017
178
- Toto-1.0,Toto-2.0-313m,0.333,0.083,0.583,-0.077,-0.162,-0.005
179
- Toto-1.0,Stat. Ensemble,0.333,0.083,0.667,-0.058,-0.134,0.012
180
- Toto-1.0,FlowState,0.417,0.167,0.708,-0.027,-0.124,0.054
181
- Toto-1.0,Toto-2.0-4m,0.583,0.333,0.833,-0.038,-0.107,0.022
182
- Toto-1.0,Toto-1.0,0.5,0.5,0.5,0.0,0.0,0.0
183
- Toto-1.0,TabPFN-TS,0.667,0.417,0.917,-0.026,-0.134,0.065
184
- Toto-1.0,AutoETS,0.5,0.25,0.752,0.061,-0.086,0.229
185
- Toto-1.0,AutoARIMA,0.667,0.417,0.917,0.026,-0.059,0.101
186
- Toto-1.0,TimesFM-2.5,0.75,0.5,0.958,0.011,-0.075,0.076
187
- Toto-1.0,Chronos-Bolt,0.667,0.417,0.875,0.025,-0.031,0.083
188
- Toto-1.0,Seasonal Naive,0.917,0.75,1.0,0.335,0.215,0.436
189
- TabPFN-TS,TiRex-2,0.167,0.0,0.417,-0.106,-0.16,-0.053
190
- TabPFN-TS,Toto-2.0-1B,0.167,0.0,0.417,-0.051,-0.107,0.007
191
- TabPFN-TS,TiRex,0.167,0.0,0.417,-0.048,-0.094,-0.002
192
- TabPFN-TS,Toto-2.0-2.5B,0.25,0.0,0.5,-0.055,-0.105,-0.005
193
- TabPFN-TS,Chronos-2,0.25,0.0,0.5,-0.041,-0.077,-0.005
194
- TabPFN-TS,Toto-2.0-22m,0.333,0.083,0.583,-0.05,-0.106,0.011
195
- TabPFN-TS,Toto-2.0-313m,0.25,0.0,0.5,-0.05,-0.099,-0.0
196
- TabPFN-TS,Stat. Ensemble,0.25,0.0,0.5,-0.031,-0.067,0.009
197
- TabPFN-TS,FlowState,0.417,0.167,0.667,-0.002,-0.058,0.061
198
- TabPFN-TS,Toto-2.0-4m,0.417,0.167,0.667,-0.011,-0.075,0.062
199
- TabPFN-TS,Toto-1.0,0.333,0.083,0.583,0.025,-0.069,0.118
200
- TabPFN-TS,TabPFN-TS,0.5,0.5,0.5,0.0,0.0,0.0
201
- TabPFN-TS,AutoETS,0.5,0.167,0.75,0.085,-0.026,0.234
202
- TabPFN-TS,AutoARIMA,0.667,0.415,0.917,0.051,-0.02,0.134
203
- TabPFN-TS,TimesFM-2.5,0.583,0.333,0.833,0.036,-0.012,0.086
204
- TabPFN-TS,Chronos-Bolt,0.5,0.25,0.75,0.049,-0.015,0.114
205
- TabPFN-TS,Seasonal Naive,1.0,1.0,1.0,0.352,0.266,0.435
206
- AutoETS,TiRex-2,0.0,0.0,0.0,-0.208,-0.431,-0.081
207
- AutoETS,Toto-2.0-1B,0.25,0.0,0.5,-0.148,-0.366,-0.018
208
- AutoETS,TiRex,0.25,0.0,0.5,-0.145,-0.367,-0.025
209
- AutoETS,Toto-2.0-2.5B,0.167,0.0,0.417,-0.152,-0.369,-0.028
210
- AutoETS,Chronos-2,0.25,0.0,0.5,-0.137,-0.354,-0.02
211
- AutoETS,Toto-2.0-22m,0.167,0.0,0.417,-0.147,-0.367,-0.026
212
- AutoETS,Toto-2.0-313m,0.25,0.0,0.5,-0.147,-0.365,-0.025
213
- AutoETS,Stat. Ensemble,0.333,0.083,0.583,-0.126,-0.345,-0.012
214
- AutoETS,FlowState,0.417,0.167,0.667,-0.094,-0.322,0.04
215
- AutoETS,Toto-2.0-4m,0.25,0.0,0.5,-0.105,-0.317,0.019
216
- AutoETS,Toto-1.0,0.5,0.248,0.75,-0.065,-0.298,0.08
217
- AutoETS,TabPFN-TS,0.5,0.25,0.833,-0.092,-0.306,0.025
218
- AutoETS,AutoETS,0.5,0.5,0.5,0.0,0.0,0.0
219
- AutoETS,AutoARIMA,0.5,0.167,0.75,-0.037,-0.271,0.112
220
- AutoETS,TimesFM-2.5,0.5,0.25,0.75,-0.053,-0.259,0.072
221
- AutoETS,Chronos-Bolt,0.75,0.5,1.0,-0.039,-0.251,0.086
222
- AutoETS,Seasonal Naive,0.917,0.75,1.0,0.292,0.084,0.43
223
- AutoARIMA,TiRex-2,0.083,0.0,0.25,-0.165,-0.274,-0.08
224
- AutoARIMA,Toto-2.0-1B,0.167,0.0,0.417,-0.107,-0.211,-0.017
225
- AutoARIMA,TiRex,0.167,0.0,0.417,-0.104,-0.221,-0.019
226
- AutoARIMA,Toto-2.0-2.5B,0.167,0.0,0.417,-0.111,-0.228,-0.019
227
- AutoARIMA,Chronos-2,0.25,0.0,0.5,-0.097,-0.21,-0.009
228
- AutoARIMA,Toto-2.0-22m,0.25,0.0,0.5,-0.106,-0.221,-0.021
229
- AutoARIMA,Toto-2.0-313m,0.167,0.0,0.417,-0.106,-0.216,-0.02
230
- AutoARIMA,Stat. Ensemble,0.167,0.0,0.417,-0.086,-0.171,-0.031
231
- AutoARIMA,FlowState,0.25,0.0,0.5,-0.055,-0.113,-0.005
232
- AutoARIMA,Toto-2.0-4m,0.417,0.167,0.667,-0.065,-0.184,0.022
233
- AutoARIMA,Toto-1.0,0.333,0.083,0.583,-0.027,-0.113,0.056
234
- AutoARIMA,TabPFN-TS,0.333,0.083,0.585,-0.053,-0.154,0.02
235
- AutoARIMA,AutoETS,0.5,0.25,0.833,0.036,-0.126,0.213
236
- AutoARIMA,AutoARIMA,0.5,0.5,0.5,0.0,0.0,0.0
237
- AutoARIMA,TimesFM-2.5,0.417,0.167,0.667,-0.016,-0.097,0.062
238
- AutoARIMA,Chronos-Bolt,0.417,0.167,0.667,-0.001,-0.08,0.069
239
- AutoARIMA,Seasonal Naive,1.0,1.0,1.0,0.317,0.242,0.396
240
- TimesFM-2.5,TiRex-2,0.083,0.0,0.25,-0.147,-0.211,-0.087
241
- TimesFM-2.5,Toto-2.0-1B,0.083,0.0,0.25,-0.09,-0.13,-0.047
242
- TimesFM-2.5,TiRex,0.083,0.0,0.25,-0.087,-0.139,-0.039
243
- TimesFM-2.5,Toto-2.0-2.5B,0.083,0.0,0.25,-0.094,-0.139,-0.053
244
- TimesFM-2.5,Chronos-2,0.083,0.0,0.25,-0.08,-0.124,-0.041
245
- TimesFM-2.5,Toto-2.0-22m,0.083,0.0,0.25,-0.089,-0.15,-0.026
246
- TimesFM-2.5,Toto-2.0-313m,0.083,0.0,0.25,-0.089,-0.136,-0.042
247
- TimesFM-2.5,Stat. Ensemble,0.167,0.0,0.417,-0.069,-0.137,-0.014
248
- TimesFM-2.5,FlowState,0.333,0.125,0.583,-0.039,-0.124,0.024
249
- TimesFM-2.5,Toto-2.0-4m,0.333,0.083,0.583,-0.049,-0.126,0.026
250
- TimesFM-2.5,Toto-1.0,0.25,0.042,0.5,-0.011,-0.082,0.07
251
- TimesFM-2.5,TabPFN-TS,0.417,0.167,0.667,-0.037,-0.094,0.012
252
- TimesFM-2.5,AutoETS,0.5,0.25,0.75,0.051,-0.077,0.205
253
- TimesFM-2.5,AutoARIMA,0.583,0.333,0.833,0.015,-0.066,0.089
254
- TimesFM-2.5,TimesFM-2.5,0.5,0.5,0.5,0.0,0.0,0.0
255
- TimesFM-2.5,Chronos-Bolt,0.583,0.333,0.833,0.014,-0.034,0.072
256
- TimesFM-2.5,Seasonal Naive,0.917,0.75,1.0,0.328,0.224,0.407
257
- Chronos-Bolt,TiRex-2,0.0,0.0,0.0,-0.163,-0.242,-0.099
258
- Chronos-Bolt,Toto-2.0-1B,0.167,0.0,0.417,-0.105,-0.162,-0.05
259
- Chronos-Bolt,TiRex,0.083,0.0,0.25,-0.103,-0.164,-0.052
260
- Chronos-Bolt,Toto-2.0-2.5B,0.083,0.0,0.25,-0.109,-0.171,-0.053
261
- Chronos-Bolt,Chronos-2,0.0,0.0,0.0,-0.095,-0.165,-0.044
262
- Chronos-Bolt,Toto-2.0-22m,0.0,0.0,0.0,-0.105,-0.159,-0.058
263
- Chronos-Bolt,Toto-2.0-313m,0.083,0.0,0.25,-0.105,-0.165,-0.049
264
- Chronos-Bolt,Stat. Ensemble,0.083,0.0,0.25,-0.084,-0.151,-0.024
265
- Chronos-Bolt,FlowState,0.167,0.0,0.375,-0.053,-0.113,0.002
266
- Chronos-Bolt,Toto-2.0-4m,0.333,0.083,0.583,-0.064,-0.126,-0.01
267
- Chronos-Bolt,Toto-1.0,0.333,0.125,0.583,-0.025,-0.09,0.03
268
- Chronos-Bolt,TabPFN-TS,0.5,0.25,0.75,-0.052,-0.128,0.014
269
- Chronos-Bolt,AutoETS,0.25,0.0,0.5,0.037,-0.094,0.201
270
- Chronos-Bolt,AutoARIMA,0.583,0.333,0.833,0.001,-0.074,0.074
271
- Chronos-Bolt,TimesFM-2.5,0.417,0.167,0.667,-0.014,-0.077,0.032
272
- Chronos-Bolt,Chronos-Bolt,0.5,0.5,0.5,0.0,0.0,0.0
273
- Chronos-Bolt,Seasonal Naive,0.917,0.75,1.0,0.318,0.219,0.402
274
- Seasonal Naive,TiRex-2,0.0,0.0,0.0,-0.706,-1.009,-0.467
275
- Seasonal Naive,Toto-2.0-1B,0.083,0.0,0.25,-0.621,-0.884,-0.386
276
- Seasonal Naive,TiRex,0.0,0.0,0.0,-0.617,-0.877,-0.392
277
- Seasonal Naive,Toto-2.0-2.5B,0.0,0.0,0.0,-0.627,-0.887,-0.398
278
- Seasonal Naive,Chronos-2,0.0,0.0,0.0,-0.606,-0.842,-0.401
279
- Seasonal Naive,Toto-2.0-22m,0.0,0.0,0.0,-0.62,-0.898,-0.396
280
- Seasonal Naive,Toto-2.0-313m,0.0,0.0,0.0,-0.62,-0.881,-0.394
281
- Seasonal Naive,Stat. Ensemble,0.0,0.0,0.0,-0.59,-0.824,-0.404
282
- Seasonal Naive,FlowState,0.0,0.0,0.0,-0.545,-0.736,-0.377
283
- Seasonal Naive,Toto-2.0-4m,0.083,0.0,0.25,-0.56,-0.847,-0.326
284
- Seasonal Naive,Toto-1.0,0.083,0.0,0.25,-0.504,-0.774,-0.274
285
- Seasonal Naive,TabPFN-TS,0.0,0.0,0.0,-0.543,-0.769,-0.363
286
- Seasonal Naive,AutoETS,0.083,0.0,0.25,-0.412,-0.755,-0.091
287
- Seasonal Naive,AutoARIMA,0.0,0.0,0.0,-0.465,-0.656,-0.319
288
- Seasonal Naive,TimesFM-2.5,0.083,0.0,0.25,-0.487,-0.686,-0.288
289
- Seasonal Naive,Chronos-Bolt,0.083,0.0,0.25,-0.467,-0.673,-0.28
290
- Seasonal Naive,Seasonal Naive,0.5,0.5,0.5,0.0,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_econ/pairwise_WAPE.csv DELETED
@@ -1,290 +0,0 @@
1
- model_1,model_2,win_rate,win_rate_lower,win_rate_upper,skill_score,skill_score_lower,skill_score_upper
2
- TiRex-2,TiRex-2,0.5,0.5,0.5,0.0,0.0,0.0
3
- TiRex-2,Toto-2.0-1B,0.583,0.333,0.833,0.054,-0.019,0.135
4
- TiRex-2,Toto-2.0-2.5B,0.583,0.25,0.833,0.05,-0.021,0.117
5
- TiRex-2,Toto-2.0-313m,0.75,0.5,1.0,0.063,-0.007,0.135
6
- TiRex-2,Toto-2.0-22m,0.667,0.417,0.917,0.068,0.017,0.127
7
- TiRex-2,TiRex,0.917,0.75,1.0,0.07,0.023,0.119
8
- TiRex-2,Chronos-2,0.75,0.5,1.0,0.088,0.017,0.151
9
- TiRex-2,Stat. Ensemble,0.833,0.583,1.0,0.064,-0.008,0.14
10
- TiRex-2,Toto-1.0,0.917,0.75,1.0,0.124,0.043,0.2
11
- TiRex-2,TimesFM-2.5,0.917,0.75,1.0,0.097,0.043,0.154
12
- TiRex-2,CatBoost,0.833,0.583,1.0,0.107,-0.003,0.217
13
- TiRex-2,TabPFN-TS,0.75,0.5,1.0,0.088,0.001,0.173
14
- TiRex-2,FlowState,0.917,0.75,1.0,0.072,-0.004,0.126
15
- TiRex-2,AutoETS,0.917,0.75,1.0,0.112,0.051,0.185
16
- TiRex-2,Toto-2.0-4m,0.917,0.75,1.0,0.132,0.068,0.203
17
- TiRex-2,Chronos-Bolt,1.0,1.0,1.0,0.168,0.089,0.254
18
- TiRex-2,Seasonal Naive,1.0,1.0,1.0,0.421,0.305,0.538
19
- Toto-2.0-1B,TiRex-2,0.417,0.167,0.667,-0.058,-0.156,0.019
20
- Toto-2.0-1B,Toto-2.0-1B,0.5,0.5,0.5,0.0,0.0,0.0
21
- Toto-2.0-1B,Toto-2.0-2.5B,0.5,0.25,0.75,-0.005,-0.023,0.01
22
- Toto-2.0-1B,Toto-2.0-313m,0.667,0.417,0.917,0.009,-0.017,0.033
23
- Toto-2.0-1B,Toto-2.0-22m,0.833,0.583,1.0,0.014,-0.085,0.08
24
- Toto-2.0-1B,TiRex,0.833,0.583,1.0,0.017,-0.022,0.044
25
- Toto-2.0-1B,Chronos-2,0.75,0.5,1.0,0.035,-0.015,0.078
26
- Toto-2.0-1B,Stat. Ensemble,0.75,0.5,1.0,0.01,-0.138,0.106
27
- Toto-2.0-1B,Toto-1.0,0.667,0.417,0.917,0.073,-0.013,0.157
28
- Toto-2.0-1B,TimesFM-2.5,0.75,0.5,0.917,0.045,-0.002,0.093
29
- Toto-2.0-1B,CatBoost,0.75,0.5,1.0,0.056,-0.124,0.175
30
- Toto-2.0-1B,TabPFN-TS,0.75,0.5,1.0,0.036,-0.112,0.136
31
- Toto-2.0-1B,FlowState,0.75,0.5,1.0,0.019,-0.152,0.114
32
- Toto-2.0-1B,AutoETS,0.75,0.5,1.0,0.061,-0.038,0.14
33
- Toto-2.0-1B,Toto-2.0-4m,0.917,0.75,1.0,0.082,-0.005,0.154
34
- Toto-2.0-1B,Chronos-Bolt,0.833,0.583,1.0,0.12,0.045,0.197
35
- Toto-2.0-1B,Seasonal Naive,0.917,0.75,1.0,0.388,0.248,0.515
36
- Toto-2.0-2.5B,TiRex-2,0.417,0.167,0.75,-0.052,-0.132,0.021
37
- Toto-2.0-2.5B,Toto-2.0-1B,0.5,0.25,0.75,0.005,-0.01,0.022
38
- Toto-2.0-2.5B,Toto-2.0-2.5B,0.5,0.5,0.5,0.0,0.0,0.0
39
- Toto-2.0-2.5B,Toto-2.0-313m,0.667,0.417,0.917,0.014,-0.007,0.033
40
- Toto-2.0-2.5B,Toto-2.0-22m,0.833,0.583,1.0,0.019,-0.065,0.083
41
- Toto-2.0-2.5B,TiRex,0.75,0.5,1.0,0.022,-0.004,0.046
42
- Toto-2.0-2.5B,Chronos-2,0.667,0.417,0.917,0.04,0.0,0.076
43
- Toto-2.0-2.5B,Stat. Ensemble,0.75,0.5,1.0,0.015,-0.114,0.104
44
- Toto-2.0-2.5B,Toto-1.0,0.667,0.417,0.917,0.078,-0.001,0.164
45
- Toto-2.0-2.5B,TimesFM-2.5,0.75,0.5,0.917,0.05,0.012,0.094
46
- Toto-2.0-2.5B,CatBoost,0.75,0.5,1.0,0.06,-0.104,0.172
47
- Toto-2.0-2.5B,TabPFN-TS,0.75,0.5,1.0,0.041,-0.09,0.131
48
- Toto-2.0-2.5B,FlowState,0.75,0.5,1.0,0.023,-0.13,0.115
49
- Toto-2.0-2.5B,AutoETS,0.75,0.5,1.0,0.065,-0.017,0.138
50
- Toto-2.0-2.5B,Toto-2.0-4m,0.917,0.75,1.0,0.087,0.01,0.16
51
- Toto-2.0-2.5B,Chronos-Bolt,0.833,0.583,1.0,0.124,0.054,0.199
52
- Toto-2.0-2.5B,Seasonal Naive,0.917,0.75,1.0,0.391,0.26,0.511
53
- Toto-2.0-313m,TiRex-2,0.25,0.0,0.5,-0.067,-0.156,0.007
54
- Toto-2.0-313m,Toto-2.0-1B,0.333,0.083,0.583,-0.009,-0.034,0.017
55
- Toto-2.0-313m,Toto-2.0-2.5B,0.333,0.083,0.583,-0.014,-0.034,0.007
56
- Toto-2.0-313m,Toto-2.0-313m,0.5,0.5,0.5,0.0,0.0,0.0
57
- Toto-2.0-313m,Toto-2.0-22m,0.667,0.417,0.917,0.006,-0.071,0.063
58
- Toto-2.0-313m,TiRex,0.583,0.333,0.833,0.008,-0.021,0.035
59
- Toto-2.0-313m,Chronos-2,0.583,0.333,0.833,0.027,-0.018,0.066
60
- Toto-2.0-313m,Stat. Ensemble,0.75,0.5,1.0,0.001,-0.131,0.091
61
- Toto-2.0-313m,Toto-1.0,0.667,0.417,0.917,0.065,-0.011,0.147
62
- Toto-2.0-313m,TimesFM-2.5,0.667,0.417,0.917,0.037,-0.004,0.079
63
- Toto-2.0-313m,CatBoost,0.833,0.583,1.0,0.047,-0.108,0.154
64
- Toto-2.0-313m,TabPFN-TS,0.75,0.5,1.0,0.027,-0.108,0.124
65
- Toto-2.0-313m,FlowState,0.75,0.5,1.0,0.01,-0.142,0.106
66
- Toto-2.0-313m,AutoETS,0.667,0.417,0.917,0.052,-0.025,0.119
67
- Toto-2.0-313m,Toto-2.0-4m,0.833,0.583,1.0,0.074,0.005,0.14
68
- Toto-2.0-313m,Chronos-Bolt,0.833,0.583,1.0,0.112,0.053,0.179
69
- Toto-2.0-313m,Seasonal Naive,0.917,0.75,1.0,0.383,0.252,0.506
70
- Toto-2.0-22m,TiRex-2,0.333,0.083,0.583,-0.073,-0.145,-0.018
71
- Toto-2.0-22m,Toto-2.0-1B,0.167,0.0,0.417,-0.015,-0.086,0.078
72
- Toto-2.0-22m,Toto-2.0-2.5B,0.167,0.0,0.417,-0.02,-0.091,0.061
73
- Toto-2.0-22m,Toto-2.0-313m,0.333,0.083,0.583,-0.006,-0.067,0.066
74
- Toto-2.0-22m,Toto-2.0-22m,0.5,0.5,0.5,0.0,0.0,0.0
75
- Toto-2.0-22m,TiRex,0.5,0.248,0.75,0.002,-0.05,0.058
76
- Toto-2.0-22m,Chronos-2,0.75,0.5,1.0,0.021,-0.055,0.091
77
- Toto-2.0-22m,Stat. Ensemble,0.583,0.333,0.833,-0.004,-0.084,0.066
78
- Toto-2.0-22m,Toto-1.0,0.75,0.5,1.0,0.059,-0.005,0.12
79
- Toto-2.0-22m,TimesFM-2.5,0.667,0.417,0.917,0.031,-0.046,0.105
80
- Toto-2.0-22m,CatBoost,0.583,0.333,0.833,0.042,-0.064,0.136
81
- Toto-2.0-22m,TabPFN-TS,0.583,0.333,0.833,0.022,-0.074,0.112
82
- Toto-2.0-22m,FlowState,0.667,0.417,0.917,0.004,-0.084,0.08
83
- Toto-2.0-22m,AutoETS,0.833,0.583,1.0,0.047,-0.016,0.095
84
- Toto-2.0-22m,Toto-2.0-4m,1.0,1.0,1.0,0.069,0.048,0.092
85
- Toto-2.0-22m,Chronos-Bolt,0.917,0.75,1.0,0.107,0.057,0.155
86
- Toto-2.0-22m,Seasonal Naive,0.917,0.75,1.0,0.379,0.262,0.497
87
- TiRex,TiRex-2,0.083,0.0,0.25,-0.076,-0.135,-0.023
88
- TiRex,Toto-2.0-1B,0.167,0.0,0.417,-0.017,-0.046,0.022
89
- TiRex,Toto-2.0-2.5B,0.25,0.0,0.5,-0.022,-0.048,0.004
90
- TiRex,Toto-2.0-313m,0.417,0.167,0.667,-0.008,-0.036,0.021
91
- TiRex,Toto-2.0-22m,0.5,0.25,0.752,-0.002,-0.061,0.048
92
- TiRex,TiRex,0.5,0.5,0.5,0.0,0.0,0.0
93
- TiRex,Chronos-2,0.667,0.333,0.917,0.019,-0.026,0.055
94
- TiRex,Stat. Ensemble,0.583,0.333,0.833,-0.007,-0.118,0.073
95
- TiRex,Toto-1.0,0.5,0.25,0.833,0.057,-0.011,0.131
96
- TiRex,TimesFM-2.5,0.833,0.667,1.0,0.029,-0.01,0.066
97
- TiRex,CatBoost,0.667,0.417,0.917,0.039,-0.111,0.151
98
- TiRex,TabPFN-TS,0.75,0.5,1.0,0.019,-0.098,0.11
99
- TiRex,FlowState,0.667,0.417,0.917,0.002,-0.132,0.081
100
- TiRex,AutoETS,0.667,0.417,0.917,0.045,-0.022,0.113
101
- TiRex,Toto-2.0-4m,0.75,0.5,1.0,0.067,0.006,0.127
102
- TiRex,Chronos-Bolt,0.917,0.75,1.0,0.105,0.043,0.176
103
- TiRex,Seasonal Naive,0.917,0.75,1.0,0.378,0.252,0.503
104
- Chronos-2,TiRex-2,0.25,0.0,0.5,-0.096,-0.178,-0.018
105
- Chronos-2,Toto-2.0-1B,0.25,0.0,0.5,-0.037,-0.085,0.015
106
- Chronos-2,Toto-2.0-2.5B,0.333,0.083,0.583,-0.042,-0.082,-0.0
107
- Chronos-2,Toto-2.0-313m,0.417,0.167,0.667,-0.028,-0.07,0.018
108
- Chronos-2,Toto-2.0-22m,0.25,0.0,0.5,-0.022,-0.1,0.052
109
- Chronos-2,TiRex,0.333,0.083,0.667,-0.019,-0.059,0.025
110
- Chronos-2,Chronos-2,0.5,0.5,0.5,0.0,0.0,0.0
111
- Chronos-2,Stat. Ensemble,0.667,0.417,0.917,-0.026,-0.142,0.05
112
- Chronos-2,Toto-1.0,0.5,0.25,0.833,0.039,-0.047,0.129
113
- Chronos-2,TimesFM-2.5,0.5,0.167,0.75,0.01,-0.025,0.05
114
- Chronos-2,CatBoost,0.583,0.333,0.833,0.021,-0.142,0.136
115
- Chronos-2,TabPFN-TS,0.667,0.417,0.917,0.0,-0.134,0.102
116
- Chronos-2,FlowState,0.583,0.333,0.833,-0.017,-0.169,0.081
117
- Chronos-2,AutoETS,0.667,0.417,0.917,0.026,-0.04,0.085
118
- Chronos-2,Toto-2.0-4m,0.583,0.333,0.833,0.049,-0.031,0.135
119
- Chronos-2,Chronos-Bolt,0.75,0.5,1.0,0.087,0.014,0.175
120
- Chronos-2,Seasonal Naive,0.917,0.75,1.0,0.366,0.237,0.489
121
- Stat. Ensemble,TiRex-2,0.167,0.0,0.417,-0.068,-0.163,0.008
122
- Stat. Ensemble,Toto-2.0-1B,0.25,0.0,0.5,-0.01,-0.119,0.121
123
- Stat. Ensemble,Toto-2.0-2.5B,0.25,0.0,0.5,-0.015,-0.116,0.103
124
- Stat. Ensemble,Toto-2.0-313m,0.25,0.0,0.5,-0.001,-0.1,0.116
125
- Stat. Ensemble,Toto-2.0-22m,0.417,0.167,0.667,0.004,-0.071,0.077
126
- Stat. Ensemble,TiRex,0.417,0.167,0.667,0.007,-0.079,0.105
127
- Stat. Ensemble,Chronos-2,0.333,0.083,0.583,0.026,-0.052,0.124
128
- Stat. Ensemble,Stat. Ensemble,0.5,0.5,0.5,0.0,0.0,0.0
129
- Stat. Ensemble,Toto-1.0,0.583,0.25,0.833,0.064,-0.025,0.153
130
- Stat. Ensemble,TimesFM-2.5,0.5,0.25,0.75,0.036,-0.044,0.138
131
- Stat. Ensemble,CatBoost,0.5,0.25,0.75,0.046,-0.019,0.117
132
- Stat. Ensemble,TabPFN-TS,0.583,0.333,0.833,0.026,-0.033,0.082
133
- Stat. Ensemble,FlowState,0.667,0.417,0.917,0.009,-0.049,0.064
134
- Stat. Ensemble,AutoETS,0.75,0.5,1.0,0.051,0.006,0.104
135
- Stat. Ensemble,Toto-2.0-4m,0.583,0.333,0.833,0.073,-0.009,0.154
136
- Stat. Ensemble,Chronos-Bolt,0.75,0.5,1.0,0.111,0.016,0.202
137
- Stat. Ensemble,Seasonal Naive,1.0,1.0,1.0,0.382,0.284,0.478
138
- Toto-1.0,TiRex-2,0.083,0.0,0.25,-0.141,-0.249,-0.045
139
- Toto-1.0,Toto-2.0-1B,0.333,0.083,0.583,-0.079,-0.187,0.013
140
- Toto-1.0,Toto-2.0-2.5B,0.333,0.083,0.583,-0.084,-0.196,0.001
141
- Toto-1.0,Toto-2.0-313m,0.333,0.083,0.583,-0.069,-0.173,0.011
142
- Toto-1.0,Toto-2.0-22m,0.25,0.0,0.5,-0.063,-0.136,0.005
143
- Toto-1.0,TiRex,0.5,0.167,0.75,-0.061,-0.151,0.011
144
- Toto-1.0,Chronos-2,0.5,0.167,0.75,-0.041,-0.149,0.045
145
- Toto-1.0,Stat. Ensemble,0.417,0.167,0.75,-0.068,-0.181,0.024
146
- Toto-1.0,Toto-1.0,0.5,0.5,0.5,0.0,0.0,0.0
147
- Toto-1.0,TimesFM-2.5,0.583,0.333,0.833,-0.03,-0.139,0.05
148
- Toto-1.0,CatBoost,0.583,0.25,0.833,-0.019,-0.168,0.102
149
- Toto-1.0,TabPFN-TS,0.583,0.333,0.833,-0.04,-0.192,0.084
150
- Toto-1.0,FlowState,0.5,0.25,0.75,-0.059,-0.205,0.059
151
- Toto-1.0,AutoETS,0.5,0.25,0.75,-0.013,-0.1,0.062
152
- Toto-1.0,Toto-2.0-4m,0.5,0.248,0.75,0.01,-0.051,0.066
153
- Toto-1.0,Chronos-Bolt,0.75,0.542,0.958,0.05,0.006,0.093
154
- Toto-1.0,Seasonal Naive,0.917,0.75,1.0,0.34,0.203,0.463
155
- TimesFM-2.5,TiRex-2,0.083,0.0,0.25,-0.108,-0.182,-0.045
156
- TimesFM-2.5,Toto-2.0-1B,0.25,0.083,0.5,-0.048,-0.103,0.002
157
- TimesFM-2.5,Toto-2.0-2.5B,0.25,0.083,0.5,-0.053,-0.103,-0.012
158
- TimesFM-2.5,Toto-2.0-313m,0.333,0.083,0.583,-0.038,-0.085,0.004
159
- TimesFM-2.5,Toto-2.0-22m,0.333,0.083,0.583,-0.032,-0.118,0.044
160
- TimesFM-2.5,TiRex,0.167,0.0,0.333,-0.03,-0.071,0.01
161
- TimesFM-2.5,Chronos-2,0.5,0.25,0.833,-0.011,-0.052,0.025
162
- TimesFM-2.5,Stat. Ensemble,0.5,0.25,0.75,-0.037,-0.161,0.042
163
- TimesFM-2.5,Toto-1.0,0.417,0.167,0.667,0.029,-0.053,0.122
164
- TimesFM-2.5,TimesFM-2.5,0.5,0.5,0.5,0.0,0.0,0.0
165
- TimesFM-2.5,CatBoost,0.667,0.417,0.917,0.011,-0.151,0.126
166
- TimesFM-2.5,TabPFN-TS,0.5,0.25,0.75,-0.01,-0.144,0.086
167
- TimesFM-2.5,FlowState,0.417,0.167,0.667,-0.028,-0.174,0.06
168
- TimesFM-2.5,AutoETS,0.583,0.331,0.833,0.016,-0.058,0.087
169
- TimesFM-2.5,Toto-2.0-4m,0.583,0.333,0.833,0.039,-0.044,0.124
170
- TimesFM-2.5,Chronos-Bolt,0.667,0.417,0.875,0.078,0.002,0.167
171
- TimesFM-2.5,Seasonal Naive,0.917,0.75,1.0,0.359,0.235,0.479
172
- CatBoost,TiRex-2,0.167,0.0,0.417,-0.12,-0.278,0.003
173
- CatBoost,Toto-2.0-1B,0.25,0.0,0.5,-0.059,-0.212,0.11
174
- CatBoost,Toto-2.0-2.5B,0.25,0.0,0.5,-0.064,-0.208,0.094
175
- CatBoost,Toto-2.0-313m,0.167,0.0,0.417,-0.05,-0.181,0.097
176
- CatBoost,Toto-2.0-22m,0.417,0.167,0.667,-0.044,-0.157,0.06
177
- CatBoost,TiRex,0.333,0.083,0.583,-0.041,-0.178,0.1
178
- CatBoost,Chronos-2,0.417,0.167,0.667,-0.021,-0.157,0.125
179
- CatBoost,Stat. Ensemble,0.5,0.25,0.75,-0.048,-0.133,0.018
180
- CatBoost,Toto-1.0,0.417,0.167,0.75,0.019,-0.114,0.144
181
- CatBoost,TimesFM-2.5,0.333,0.083,0.583,-0.011,-0.145,0.131
182
- CatBoost,CatBoost,0.5,0.5,0.5,0.0,0.0,0.0
183
- CatBoost,TabPFN-TS,0.5,0.25,0.75,-0.021,-0.113,0.061
184
- CatBoost,FlowState,0.5,0.25,0.75,-0.039,-0.146,0.029
185
- CatBoost,AutoETS,0.583,0.25,0.833,0.006,-0.085,0.101
186
- CatBoost,Toto-2.0-4m,0.583,0.25,0.833,0.028,-0.083,0.129
187
- CatBoost,Chronos-Bolt,0.583,0.25,0.833,0.068,-0.042,0.181
188
- CatBoost,Seasonal Naive,1.0,1.0,1.0,0.352,0.249,0.443
189
- TabPFN-TS,TiRex-2,0.25,0.0,0.5,-0.097,-0.209,-0.001
190
- TabPFN-TS,Toto-2.0-1B,0.25,0.0,0.5,-0.037,-0.158,0.101
191
- TabPFN-TS,Toto-2.0-2.5B,0.25,0.0,0.5,-0.042,-0.151,0.082
192
- TabPFN-TS,Toto-2.0-313m,0.25,0.0,0.5,-0.028,-0.142,0.097
193
- TabPFN-TS,Toto-2.0-22m,0.417,0.167,0.667,-0.022,-0.126,0.069
194
- TabPFN-TS,TiRex,0.25,0.0,0.5,-0.02,-0.124,0.089
195
- TabPFN-TS,Chronos-2,0.333,0.083,0.583,-0.0,-0.113,0.119
196
- TabPFN-TS,Stat. Ensemble,0.417,0.167,0.667,-0.027,-0.089,0.032
197
- TabPFN-TS,Toto-1.0,0.417,0.167,0.667,0.039,-0.092,0.161
198
- TabPFN-TS,TimesFM-2.5,0.5,0.25,0.75,0.01,-0.095,0.126
199
- TabPFN-TS,CatBoost,0.5,0.25,0.75,0.021,-0.065,0.101
200
- TabPFN-TS,TabPFN-TS,0.5,0.5,0.5,0.0,0.0,0.0
201
- TabPFN-TS,FlowState,0.333,0.083,0.583,-0.018,-0.086,0.053
202
- TabPFN-TS,AutoETS,0.667,0.417,0.917,0.026,-0.063,0.099
203
- TabPFN-TS,Toto-2.0-4m,0.583,0.331,0.833,0.048,-0.067,0.151
204
- TabPFN-TS,Chronos-Bolt,0.583,0.331,0.833,0.087,-0.047,0.2
205
- TabPFN-TS,Seasonal Naive,1.0,1.0,1.0,0.365,0.273,0.457
206
- FlowState,TiRex-2,0.083,0.0,0.25,-0.078,-0.144,0.004
207
- FlowState,Toto-2.0-1B,0.25,0.0,0.5,-0.019,-0.129,0.132
208
- FlowState,Toto-2.0-2.5B,0.25,0.0,0.5,-0.024,-0.13,0.115
209
- FlowState,Toto-2.0-313m,0.25,0.0,0.5,-0.01,-0.119,0.124
210
- FlowState,Toto-2.0-22m,0.333,0.083,0.583,-0.004,-0.087,0.077
211
- FlowState,TiRex,0.333,0.083,0.583,-0.002,-0.088,0.117
212
- FlowState,Chronos-2,0.417,0.167,0.667,0.017,-0.088,0.144
213
- FlowState,Stat. Ensemble,0.333,0.083,0.583,-0.009,-0.068,0.047
214
- FlowState,Toto-1.0,0.5,0.25,0.75,0.056,-0.062,0.17
215
- FlowState,TimesFM-2.5,0.583,0.333,0.833,0.027,-0.064,0.149
216
- FlowState,CatBoost,0.5,0.25,0.75,0.038,-0.03,0.127
217
- FlowState,TabPFN-TS,0.667,0.417,0.917,0.018,-0.056,0.079
218
- FlowState,FlowState,0.5,0.5,0.5,0.0,0.0,0.0
219
- FlowState,AutoETS,0.5,0.25,0.75,0.043,-0.045,0.131
220
- FlowState,Toto-2.0-4m,0.417,0.167,0.667,0.065,-0.028,0.157
221
- FlowState,Chronos-Bolt,0.583,0.332,0.833,0.103,-0.011,0.214
222
- FlowState,Seasonal Naive,0.917,0.75,1.0,0.376,0.258,0.488
223
- AutoETS,TiRex-2,0.083,0.0,0.25,-0.126,-0.227,-0.054
224
- AutoETS,Toto-2.0-1B,0.25,0.0,0.5,-0.065,-0.163,0.036
225
- AutoETS,Toto-2.0-2.5B,0.25,0.0,0.5,-0.07,-0.16,0.017
226
- AutoETS,Toto-2.0-313m,0.333,0.083,0.583,-0.055,-0.135,0.025
227
- AutoETS,Toto-2.0-22m,0.167,0.0,0.417,-0.049,-0.105,0.016
228
- AutoETS,TiRex,0.333,0.083,0.583,-0.047,-0.127,0.022
229
- AutoETS,Chronos-2,0.333,0.083,0.583,-0.027,-0.093,0.039
230
- AutoETS,Stat. Ensemble,0.25,0.0,0.5,-0.054,-0.115,-0.006
231
- AutoETS,Toto-1.0,0.5,0.25,0.75,0.013,-0.066,0.091
232
- AutoETS,TimesFM-2.5,0.417,0.167,0.669,-0.016,-0.095,0.055
233
- AutoETS,CatBoost,0.417,0.167,0.75,-0.006,-0.113,0.079
234
- AutoETS,TabPFN-TS,0.333,0.083,0.583,-0.027,-0.11,0.059
235
- AutoETS,FlowState,0.5,0.25,0.75,-0.045,-0.151,0.043
236
- AutoETS,AutoETS,0.5,0.5,0.5,0.0,0.0,0.0
237
- AutoETS,Toto-2.0-4m,0.417,0.167,0.667,0.023,-0.034,0.101
238
- AutoETS,Chronos-Bolt,0.667,0.333,0.917,0.063,-0.003,0.135
239
- AutoETS,Seasonal Naive,1.0,1.0,1.0,0.348,0.248,0.455
240
- Toto-2.0-4m,TiRex-2,0.083,0.0,0.25,-0.152,-0.255,-0.073
241
- Toto-2.0-4m,Toto-2.0-1B,0.083,0.0,0.25,-0.09,-0.182,0.005
242
- Toto-2.0-4m,Toto-2.0-2.5B,0.083,0.0,0.25,-0.095,-0.19,-0.011
243
- Toto-2.0-4m,Toto-2.0-313m,0.167,0.0,0.417,-0.08,-0.163,-0.005
244
- Toto-2.0-4m,Toto-2.0-22m,0.0,0.0,0.0,-0.074,-0.101,-0.051
245
- Toto-2.0-4m,TiRex,0.25,0.0,0.5,-0.071,-0.145,-0.006
246
- Toto-2.0-4m,Chronos-2,0.417,0.167,0.667,-0.051,-0.155,0.03
247
- Toto-2.0-4m,Stat. Ensemble,0.417,0.167,0.667,-0.079,-0.182,0.009
248
- Toto-2.0-4m,Toto-1.0,0.5,0.25,0.752,-0.01,-0.071,0.048
249
- Toto-2.0-4m,TimesFM-2.5,0.417,0.167,0.667,-0.04,-0.142,0.043
250
- Toto-2.0-4m,CatBoost,0.417,0.167,0.75,-0.029,-0.148,0.077
251
- Toto-2.0-4m,TabPFN-TS,0.417,0.167,0.669,-0.051,-0.178,0.063
252
- Toto-2.0-4m,FlowState,0.583,0.333,0.833,-0.069,-0.186,0.027
253
- Toto-2.0-4m,AutoETS,0.583,0.333,0.833,-0.023,-0.112,0.033
254
- Toto-2.0-4m,Toto-2.0-4m,0.5,0.5,0.5,0.0,0.0,0.0
255
- Toto-2.0-4m,Chronos-Bolt,0.75,0.5,1.0,0.041,0.002,0.082
256
- Toto-2.0-4m,Seasonal Naive,0.917,0.75,1.0,0.333,0.197,0.46
257
- Chronos-Bolt,TiRex-2,0.0,0.0,0.0,-0.201,-0.34,-0.098
258
- Chronos-Bolt,Toto-2.0-1B,0.167,0.0,0.417,-0.136,-0.246,-0.047
259
- Chronos-Bolt,Toto-2.0-2.5B,0.167,0.0,0.417,-0.142,-0.249,-0.058
260
- Chronos-Bolt,Toto-2.0-313m,0.167,0.0,0.417,-0.126,-0.218,-0.055
261
- Chronos-Bolt,Toto-2.0-22m,0.083,0.0,0.25,-0.12,-0.184,-0.061
262
- Chronos-Bolt,TiRex,0.083,0.0,0.25,-0.117,-0.213,-0.045
263
- Chronos-Bolt,Chronos-2,0.25,0.0,0.5,-0.096,-0.213,-0.014
264
- Chronos-Bolt,Stat. Ensemble,0.25,0.0,0.5,-0.125,-0.253,-0.016
265
- Chronos-Bolt,Toto-1.0,0.25,0.042,0.458,-0.053,-0.102,-0.006
266
- Chronos-Bolt,TimesFM-2.5,0.333,0.125,0.583,-0.084,-0.2,-0.002
267
- Chronos-Bolt,CatBoost,0.417,0.167,0.75,-0.073,-0.221,0.041
268
- Chronos-Bolt,TabPFN-TS,0.417,0.167,0.669,-0.095,-0.249,0.045
269
- Chronos-Bolt,FlowState,0.417,0.167,0.668,-0.115,-0.272,0.01
270
- Chronos-Bolt,AutoETS,0.333,0.083,0.667,-0.067,-0.156,0.003
271
- Chronos-Bolt,Toto-2.0-4m,0.25,0.0,0.5,-0.042,-0.089,-0.002
272
- Chronos-Bolt,Chronos-Bolt,0.5,0.5,0.5,0.0,0.0,0.0
273
- Chronos-Bolt,Seasonal Naive,0.833,0.583,1.0,0.305,0.17,0.432
274
- Seasonal Naive,TiRex-2,0.0,0.0,0.0,-0.728,-1.165,-0.439
275
- Seasonal Naive,Toto-2.0-1B,0.083,0.0,0.25,-0.634,-1.063,-0.329
276
- Seasonal Naive,Toto-2.0-2.5B,0.083,0.0,0.25,-0.642,-1.045,-0.352
277
- Seasonal Naive,Toto-2.0-313m,0.083,0.0,0.25,-0.62,-1.022,-0.337
278
- Seasonal Naive,Toto-2.0-22m,0.083,0.0,0.25,-0.61,-0.988,-0.356
279
- Seasonal Naive,TiRex,0.083,0.0,0.25,-0.607,-1.014,-0.337
280
- Seasonal Naive,Chronos-2,0.083,0.0,0.25,-0.576,-0.957,-0.311
281
- Seasonal Naive,Stat. Ensemble,0.0,0.0,0.0,-0.618,-0.915,-0.396
282
- Seasonal Naive,Toto-1.0,0.083,0.0,0.25,-0.515,-0.863,-0.255
283
- Seasonal Naive,TimesFM-2.5,0.083,0.0,0.25,-0.56,-0.92,-0.308
284
- Seasonal Naive,CatBoost,0.0,0.0,0.0,-0.543,-0.796,-0.331
285
- Seasonal Naive,TabPFN-TS,0.0,0.0,0.0,-0.576,-0.842,-0.375
286
- Seasonal Naive,FlowState,0.083,0.0,0.25,-0.604,-0.954,-0.348
287
- Seasonal Naive,AutoETS,0.0,0.0,0.0,-0.535,-0.834,-0.33
288
- Seasonal Naive,Toto-2.0-4m,0.083,0.0,0.25,-0.5,-0.851,-0.245
289
- Seasonal Naive,Chronos-Bolt,0.167,0.0,0.417,-0.438,-0.76,-0.205
290
- Seasonal Naive,Seasonal Naive,0.5,0.5,0.5,0.0,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_econ/pairwise_WQL.csv DELETED
@@ -1,257 +0,0 @@
1
- model_1,model_2,win_rate,win_rate_lower,win_rate_upper,skill_score,skill_score_lower,skill_score_upper
2
- TiRex-2,TiRex-2,0.5,0.5,0.5,0.0,0.0,0.0
3
- TiRex-2,Toto-2.0-1B,0.667,0.333,0.917,0.055,-0.019,0.139
4
- TiRex-2,Toto-2.0-2.5B,0.583,0.25,0.833,0.048,-0.025,0.117
5
- TiRex-2,Toto-2.0-313m,0.833,0.583,1.0,0.06,-0.008,0.128
6
- TiRex-2,TiRex,0.917,0.75,1.0,0.06,0.02,0.102
7
- TiRex-2,Toto-2.0-22m,0.75,0.5,0.917,0.056,-0.002,0.12
8
- TiRex-2,Chronos-2,0.833,0.583,1.0,0.078,0.01,0.141
9
- TiRex-2,FlowState,0.917,0.75,1.0,0.078,-0.002,0.138
10
- TiRex-2,Toto-1.0,0.917,0.75,1.0,0.12,0.047,0.19
11
- TiRex-2,TabPFN-TS,0.667,0.417,0.917,0.089,0.016,0.164
12
- TiRex-2,TimesFM-2.5,0.917,0.75,1.0,0.103,0.049,0.166
13
- TiRex-2,Toto-2.0-4m,0.917,0.75,1.0,0.116,0.049,0.192
14
- TiRex-2,Stat. Ensemble,0.833,0.583,1.0,0.122,0.04,0.196
15
- TiRex-2,Chronos-Bolt,1.0,1.0,1.0,0.155,0.081,0.238
16
- TiRex-2,AutoETS,0.917,0.75,1.0,0.139,0.08,0.207
17
- TiRex-2,Seasonal Naive,1.0,1.0,1.0,0.455,0.337,0.57
18
- Toto-2.0-1B,TiRex-2,0.333,0.083,0.667,-0.059,-0.161,0.019
19
- Toto-2.0-1B,Toto-2.0-1B,0.5,0.5,0.5,0.0,0.0,0.0
20
- Toto-2.0-1B,Toto-2.0-2.5B,0.333,0.083,0.583,-0.008,-0.037,0.017
21
- Toto-2.0-1B,Toto-2.0-313m,0.833,0.583,1.0,0.005,-0.033,0.035
22
- Toto-2.0-1B,TiRex,0.667,0.417,0.917,0.004,-0.047,0.042
23
- Toto-2.0-1B,Toto-2.0-22m,0.833,0.583,1.0,0.001,-0.102,0.066
24
- Toto-2.0-1B,Chronos-2,0.75,0.5,1.0,0.024,-0.03,0.068
25
- Toto-2.0-1B,FlowState,0.833,0.583,1.0,0.024,-0.148,0.118
26
- Toto-2.0-1B,Toto-1.0,0.75,0.5,1.0,0.069,-0.007,0.141
27
- Toto-2.0-1B,TabPFN-TS,0.833,0.583,1.0,0.036,-0.093,0.128
28
- Toto-2.0-1B,TimesFM-2.5,0.75,0.5,0.917,0.051,0.008,0.092
29
- Toto-2.0-1B,Toto-2.0-4m,0.833,0.583,1.0,0.065,-0.05,0.147
30
- Toto-2.0-1B,Stat. Ensemble,0.75,0.5,1.0,0.07,-0.103,0.189
31
- Toto-2.0-1B,Chronos-Bolt,0.917,0.75,1.0,0.106,0.031,0.179
32
- Toto-2.0-1B,AutoETS,0.75,0.5,1.0,0.088,-0.019,0.161
33
- Toto-2.0-1B,Seasonal Naive,0.917,0.75,1.0,0.424,0.268,0.551
34
- Toto-2.0-2.5B,TiRex-2,0.417,0.167,0.75,-0.05,-0.132,0.024
35
- Toto-2.0-2.5B,Toto-2.0-1B,0.667,0.417,0.917,0.008,-0.017,0.035
36
- Toto-2.0-2.5B,Toto-2.0-2.5B,0.5,0.5,0.5,0.0,0.0,0.0
37
- Toto-2.0-2.5B,Toto-2.0-313m,0.667,0.417,0.917,0.012,-0.006,0.031
38
- Toto-2.0-2.5B,TiRex,0.5,0.25,0.752,0.012,-0.023,0.05
39
- Toto-2.0-2.5B,Toto-2.0-22m,0.667,0.417,0.917,0.008,-0.067,0.071
40
- Toto-2.0-2.5B,Chronos-2,0.667,0.417,0.917,0.031,-0.005,0.066
41
- Toto-2.0-2.5B,FlowState,0.75,0.5,1.0,0.032,-0.113,0.118
42
- Toto-2.0-2.5B,Toto-1.0,0.75,0.5,1.0,0.076,0.004,0.152
43
- Toto-2.0-2.5B,TabPFN-TS,0.75,0.5,1.0,0.043,-0.062,0.119
44
- Toto-2.0-2.5B,TimesFM-2.5,0.75,0.5,1.0,0.058,0.023,0.098
45
- Toto-2.0-2.5B,Toto-2.0-4m,0.833,0.583,1.0,0.072,-0.015,0.154
46
- Toto-2.0-2.5B,Stat. Ensemble,0.75,0.5,1.0,0.078,-0.064,0.184
47
- Toto-2.0-2.5B,Chronos-Bolt,0.833,0.583,1.0,0.113,0.048,0.183
48
- Toto-2.0-2.5B,AutoETS,0.75,0.5,1.0,0.095,0.016,0.157
49
- Toto-2.0-2.5B,Seasonal Naive,0.917,0.75,1.0,0.428,0.293,0.546
50
- Toto-2.0-313m,TiRex-2,0.167,0.0,0.417,-0.063,-0.147,0.008
51
- Toto-2.0-313m,Toto-2.0-1B,0.167,0.0,0.417,-0.005,-0.036,0.032
52
- Toto-2.0-313m,Toto-2.0-2.5B,0.333,0.083,0.583,-0.013,-0.032,0.006
53
- Toto-2.0-313m,Toto-2.0-313m,0.5,0.5,0.5,0.0,0.0,0.0
54
- Toto-2.0-313m,TiRex,0.667,0.417,0.917,-0.0,-0.036,0.031
55
- Toto-2.0-313m,Toto-2.0-22m,0.75,0.5,1.0,-0.004,-0.07,0.045
56
- Toto-2.0-313m,Chronos-2,0.583,0.333,0.833,0.019,-0.026,0.058
57
- Toto-2.0-313m,FlowState,0.75,0.5,1.0,0.02,-0.121,0.107
58
- Toto-2.0-313m,Toto-1.0,0.75,0.5,1.0,0.064,0.003,0.132
59
- Toto-2.0-313m,TabPFN-TS,0.667,0.417,0.917,0.032,-0.07,0.111
60
- Toto-2.0-313m,TimesFM-2.5,0.75,0.5,1.0,0.046,0.006,0.086
61
- Toto-2.0-313m,Toto-2.0-4m,0.833,0.583,1.0,0.06,-0.02,0.135
62
- Toto-2.0-313m,Stat. Ensemble,0.75,0.5,1.0,0.066,-0.074,0.17
63
- Toto-2.0-313m,Chronos-Bolt,0.833,0.583,1.0,0.102,0.048,0.161
64
- Toto-2.0-313m,AutoETS,0.75,0.5,1.0,0.084,0.01,0.142
65
- Toto-2.0-313m,Seasonal Naive,0.917,0.75,1.0,0.421,0.285,0.539
66
- TiRex,TiRex-2,0.083,0.0,0.25,-0.063,-0.114,-0.021
67
- TiRex,Toto-2.0-1B,0.333,0.083,0.583,-0.005,-0.044,0.045
68
- TiRex,Toto-2.0-2.5B,0.5,0.248,0.75,-0.012,-0.052,0.022
69
- TiRex,Toto-2.0-313m,0.333,0.083,0.583,0.0,-0.031,0.034
70
- TiRex,TiRex,0.5,0.5,0.5,0.0,0.0,0.0
71
- TiRex,Toto-2.0-22m,0.417,0.167,0.667,-0.004,-0.057,0.046
72
- TiRex,Chronos-2,0.583,0.333,0.833,0.019,-0.029,0.058
73
- TiRex,FlowState,0.75,0.5,1.0,0.02,-0.099,0.09
74
- TiRex,Toto-1.0,0.667,0.333,0.917,0.064,0.009,0.124
75
- TiRex,TabPFN-TS,0.75,0.5,1.0,0.032,-0.059,0.112
76
- TiRex,TimesFM-2.5,0.833,0.667,1.0,0.047,0.005,0.084
77
- TiRex,Toto-2.0-4m,0.75,0.5,1.0,0.06,-0.009,0.128
78
- TiRex,Stat. Ensemble,0.75,0.5,1.0,0.066,-0.055,0.161
79
- TiRex,Chronos-Bolt,0.917,0.75,1.0,0.102,0.047,0.167
80
- TiRex,AutoETS,0.833,0.583,1.0,0.084,0.017,0.145
81
- TiRex,Seasonal Naive,1.0,1.0,1.0,0.421,0.287,0.546
82
- Toto-2.0-22m,TiRex-2,0.25,0.083,0.5,-0.059,-0.136,0.002
83
- Toto-2.0-22m,Toto-2.0-1B,0.167,0.0,0.417,-0.001,-0.071,0.093
84
- Toto-2.0-22m,Toto-2.0-2.5B,0.333,0.083,0.583,-0.008,-0.076,0.063
85
- Toto-2.0-22m,Toto-2.0-313m,0.25,0.0,0.5,0.004,-0.047,0.066
86
- Toto-2.0-22m,TiRex,0.583,0.333,0.833,0.004,-0.048,0.054
87
- Toto-2.0-22m,Toto-2.0-22m,0.5,0.5,0.5,0.0,0.0,0.0
88
- Toto-2.0-22m,Chronos-2,0.75,0.5,1.0,0.023,-0.054,0.089
89
- Toto-2.0-22m,FlowState,0.583,0.333,0.833,0.024,-0.06,0.092
90
- Toto-2.0-22m,Toto-1.0,0.833,0.583,1.0,0.068,0.015,0.122
91
- Toto-2.0-22m,TabPFN-TS,0.583,0.333,0.833,0.035,-0.049,0.113
92
- Toto-2.0-22m,TimesFM-2.5,0.75,0.5,1.0,0.05,-0.027,0.127
93
- Toto-2.0-22m,Toto-2.0-4m,1.0,1.0,1.0,0.064,0.041,0.091
94
- Toto-2.0-22m,Stat. Ensemble,0.667,0.417,0.917,0.07,-0.032,0.161
95
- Toto-2.0-22m,Chronos-Bolt,0.917,0.75,1.0,0.105,0.063,0.147
96
- Toto-2.0-22m,AutoETS,0.917,0.75,1.0,0.088,0.02,0.13
97
- Toto-2.0-22m,Seasonal Naive,0.917,0.75,1.0,0.423,0.3,0.539
98
- Chronos-2,TiRex-2,0.167,0.0,0.417,-0.084,-0.164,-0.01
99
- Chronos-2,Toto-2.0-1B,0.25,0.0,0.5,-0.024,-0.072,0.029
100
- Chronos-2,Toto-2.0-2.5B,0.333,0.083,0.583,-0.032,-0.07,0.005
101
- Chronos-2,Toto-2.0-313m,0.417,0.167,0.667,-0.019,-0.061,0.025
102
- Chronos-2,TiRex,0.417,0.167,0.667,-0.02,-0.062,0.028
103
- Chronos-2,Toto-2.0-22m,0.25,0.0,0.5,-0.024,-0.098,0.052
104
- Chronos-2,Chronos-2,0.5,0.5,0.5,0.0,0.0,0.0
105
- Chronos-2,FlowState,0.583,0.333,0.833,0.001,-0.142,0.096
106
- Chronos-2,Toto-1.0,0.5,0.25,0.833,0.046,-0.028,0.132
107
- Chronos-2,TabPFN-TS,0.667,0.417,0.917,0.013,-0.089,0.095
108
- Chronos-2,TimesFM-2.5,0.667,0.333,0.917,0.028,-0.008,0.061
109
- Chronos-2,Toto-2.0-4m,0.667,0.415,0.917,0.042,-0.047,0.135
110
- Chronos-2,Stat. Ensemble,0.833,0.583,1.0,0.048,-0.082,0.141
111
- Chronos-2,Chronos-Bolt,0.667,0.417,0.917,0.084,0.014,0.167
112
- Chronos-2,AutoETS,0.917,0.75,1.0,0.066,0.004,0.112
113
- Chronos-2,Seasonal Naive,0.917,0.75,1.0,0.41,0.281,0.527
114
- FlowState,TiRex-2,0.083,0.0,0.25,-0.085,-0.16,0.002
115
- FlowState,Toto-2.0-1B,0.167,0.0,0.417,-0.025,-0.134,0.129
116
- FlowState,Toto-2.0-2.5B,0.25,0.0,0.5,-0.033,-0.134,0.102
117
- FlowState,Toto-2.0-313m,0.25,0.0,0.5,-0.02,-0.119,0.108
118
- FlowState,TiRex,0.25,0.0,0.5,-0.02,-0.099,0.09
119
- FlowState,Toto-2.0-22m,0.417,0.167,0.667,-0.025,-0.101,0.057
120
- FlowState,Chronos-2,0.417,0.167,0.667,-0.001,-0.106,0.124
121
- FlowState,FlowState,0.5,0.5,0.5,0.0,0.0,0.0
122
- FlowState,Toto-1.0,0.583,0.332,0.833,0.045,-0.064,0.156
123
- FlowState,TabPFN-TS,0.667,0.417,0.917,0.012,-0.07,0.076
124
- FlowState,TimesFM-2.5,0.583,0.333,0.833,0.027,-0.07,0.156
125
- FlowState,Toto-2.0-4m,0.5,0.25,0.75,0.041,-0.039,0.119
126
- FlowState,Stat. Ensemble,0.583,0.333,0.833,0.047,-0.025,0.119
127
- FlowState,Chronos-Bolt,0.583,0.332,0.833,0.083,-0.022,0.187
128
- FlowState,AutoETS,0.667,0.417,0.917,0.065,-0.019,0.146
129
- FlowState,Seasonal Naive,0.917,0.75,1.0,0.409,0.289,0.52
130
- Toto-1.0,TiRex-2,0.083,0.0,0.25,-0.137,-0.234,-0.049
131
- Toto-1.0,Toto-2.0-1B,0.25,0.0,0.5,-0.074,-0.164,0.007
132
- Toto-1.0,Toto-2.0-2.5B,0.25,0.0,0.5,-0.082,-0.179,-0.004
133
- Toto-1.0,Toto-2.0-313m,0.25,0.0,0.5,-0.069,-0.151,-0.003
134
- Toto-1.0,TiRex,0.333,0.083,0.667,-0.069,-0.142,-0.009
135
- Toto-1.0,Toto-2.0-22m,0.167,0.0,0.417,-0.073,-0.139,-0.015
136
- Toto-1.0,Chronos-2,0.5,0.167,0.75,-0.048,-0.153,0.028
137
- Toto-1.0,FlowState,0.417,0.167,0.668,-0.047,-0.184,0.06
138
- Toto-1.0,Toto-1.0,0.5,0.5,0.5,0.0,0.0,0.0
139
- Toto-1.0,TabPFN-TS,0.583,0.333,0.833,-0.035,-0.158,0.074
140
- Toto-1.0,TimesFM-2.5,0.583,0.333,0.833,-0.019,-0.113,0.05
141
- Toto-1.0,Toto-2.0-4m,0.583,0.333,0.833,-0.004,-0.072,0.047
142
- Toto-1.0,Stat. Ensemble,0.583,0.333,0.833,0.002,-0.131,0.109
143
- Toto-1.0,Chronos-Bolt,0.833,0.667,1.0,0.04,0.003,0.076
144
- Toto-1.0,AutoETS,0.667,0.417,0.917,0.021,-0.072,0.095
145
- Toto-1.0,Seasonal Naive,0.833,0.583,1.0,0.381,0.237,0.506
146
- TabPFN-TS,TiRex-2,0.333,0.083,0.583,-0.098,-0.197,-0.016
147
- TabPFN-TS,Toto-2.0-1B,0.167,0.0,0.417,-0.037,-0.147,0.085
148
- TabPFN-TS,Toto-2.0-2.5B,0.25,0.0,0.5,-0.045,-0.135,0.059
149
- TabPFN-TS,Toto-2.0-313m,0.333,0.083,0.583,-0.033,-0.125,0.065
150
- TabPFN-TS,TiRex,0.25,0.0,0.5,-0.033,-0.126,0.056
151
- TabPFN-TS,Toto-2.0-22m,0.417,0.167,0.667,-0.037,-0.127,0.046
152
- TabPFN-TS,Chronos-2,0.333,0.083,0.583,-0.013,-0.105,0.082
153
- TabPFN-TS,FlowState,0.333,0.083,0.583,-0.012,-0.082,0.066
154
- TabPFN-TS,Toto-1.0,0.417,0.167,0.667,0.034,-0.08,0.137
155
- TabPFN-TS,TabPFN-TS,0.5,0.5,0.5,0.0,0.0,0.0
156
- TabPFN-TS,TimesFM-2.5,0.5,0.25,0.75,0.015,-0.08,0.115
157
- TabPFN-TS,Toto-2.0-4m,0.583,0.331,0.833,0.03,-0.068,0.123
158
- TabPFN-TS,Stat. Ensemble,0.5,0.25,0.833,0.036,-0.043,0.12
159
- TabPFN-TS,Chronos-Bolt,0.583,0.331,0.833,0.072,-0.043,0.173
160
- TabPFN-TS,AutoETS,0.75,0.5,1.0,0.054,-0.021,0.112
161
- TabPFN-TS,Seasonal Naive,1.0,1.0,1.0,0.402,0.302,0.502
162
- TimesFM-2.5,TiRex-2,0.083,0.0,0.25,-0.115,-0.199,-0.052
163
- TimesFM-2.5,Toto-2.0-1B,0.25,0.083,0.5,-0.054,-0.101,-0.008
164
- TimesFM-2.5,Toto-2.0-2.5B,0.25,0.0,0.5,-0.062,-0.108,-0.023
165
- TimesFM-2.5,Toto-2.0-313m,0.25,0.0,0.5,-0.049,-0.094,-0.006
166
- TimesFM-2.5,TiRex,0.167,0.0,0.333,-0.049,-0.092,-0.005
167
- TimesFM-2.5,Toto-2.0-22m,0.25,0.0,0.5,-0.053,-0.146,0.027
168
- TimesFM-2.5,Chronos-2,0.333,0.083,0.667,-0.029,-0.064,0.008
169
- TimesFM-2.5,FlowState,0.417,0.167,0.667,-0.028,-0.185,0.066
170
- TimesFM-2.5,Toto-1.0,0.417,0.167,0.667,0.019,-0.052,0.102
171
- TimesFM-2.5,TabPFN-TS,0.5,0.25,0.75,-0.016,-0.13,0.074
172
- TimesFM-2.5,TimesFM-2.5,0.5,0.5,0.5,0.0,0.0,0.0
173
- TimesFM-2.5,Toto-2.0-4m,0.5,0.25,0.75,0.015,-0.091,0.11
174
- TimesFM-2.5,Stat. Ensemble,0.667,0.417,0.917,0.021,-0.12,0.113
175
- TimesFM-2.5,Chronos-Bolt,0.583,0.333,0.833,0.058,-0.015,0.143
176
- TimesFM-2.5,AutoETS,0.75,0.5,1.0,0.04,-0.045,0.104
177
- TimesFM-2.5,Seasonal Naive,0.917,0.75,1.0,0.393,0.257,0.517
178
- Toto-2.0-4m,TiRex-2,0.083,0.0,0.25,-0.132,-0.238,-0.051
179
- Toto-2.0-4m,Toto-2.0-1B,0.167,0.0,0.417,-0.069,-0.172,0.048
180
- Toto-2.0-4m,Toto-2.0-2.5B,0.167,0.0,0.417,-0.078,-0.182,0.015
181
- Toto-2.0-4m,Toto-2.0-313m,0.167,0.0,0.417,-0.064,-0.156,0.019
182
- Toto-2.0-4m,TiRex,0.25,0.0,0.5,-0.064,-0.147,0.009
183
- Toto-2.0-4m,Toto-2.0-22m,0.0,0.0,0.0,-0.069,-0.101,-0.043
184
- Toto-2.0-4m,Chronos-2,0.333,0.083,0.585,-0.044,-0.156,0.045
185
- Toto-2.0-4m,FlowState,0.5,0.25,0.75,-0.043,-0.135,0.037
186
- Toto-2.0-4m,Toto-1.0,0.417,0.167,0.667,0.004,-0.049,0.067
187
- Toto-2.0-4m,TabPFN-TS,0.417,0.167,0.669,-0.031,-0.14,0.063
188
- Toto-2.0-4m,TimesFM-2.5,0.5,0.25,0.75,-0.015,-0.124,0.083
189
- Toto-2.0-4m,Toto-2.0-4m,0.5,0.5,0.5,0.0,0.0,0.0
190
- Toto-2.0-4m,Stat. Ensemble,0.667,0.417,0.917,0.006,-0.12,0.107
191
- Toto-2.0-4m,Chronos-Bolt,0.75,0.5,1.0,0.044,0.007,0.091
192
- Toto-2.0-4m,AutoETS,0.75,0.5,1.0,0.025,-0.068,0.081
193
- Toto-2.0-4m,Seasonal Naive,0.917,0.75,1.0,0.384,0.244,0.506
194
- Stat. Ensemble,TiRex-2,0.167,0.0,0.417,-0.139,-0.244,-0.042
195
- Stat. Ensemble,Toto-2.0-1B,0.25,0.0,0.5,-0.076,-0.232,0.093
196
- Stat. Ensemble,Toto-2.0-2.5B,0.25,0.0,0.5,-0.084,-0.226,0.061
197
- Stat. Ensemble,Toto-2.0-313m,0.25,0.0,0.5,-0.071,-0.205,0.069
198
- Stat. Ensemble,TiRex,0.25,0.0,0.5,-0.071,-0.192,0.052
199
- Stat. Ensemble,Toto-2.0-22m,0.333,0.083,0.583,-0.075,-0.192,0.031
200
- Stat. Ensemble,Chronos-2,0.167,0.0,0.417,-0.05,-0.164,0.076
201
- Stat. Ensemble,FlowState,0.417,0.167,0.667,-0.049,-0.135,0.025
202
- Stat. Ensemble,Toto-1.0,0.417,0.167,0.667,-0.002,-0.122,0.116
203
- Stat. Ensemble,TabPFN-TS,0.5,0.167,0.75,-0.037,-0.136,0.042
204
- Stat. Ensemble,TimesFM-2.5,0.333,0.083,0.583,-0.021,-0.127,0.107
205
- Stat. Ensemble,Toto-2.0-4m,0.333,0.083,0.583,-0.006,-0.12,0.107
206
- Stat. Ensemble,Stat. Ensemble,0.5,0.5,0.5,0.0,0.0,0.0
207
- Stat. Ensemble,Chronos-Bolt,0.417,0.167,0.667,0.038,-0.083,0.155
208
- Stat. Ensemble,AutoETS,0.417,0.167,0.667,0.019,-0.068,0.095
209
- Stat. Ensemble,Seasonal Naive,1.0,1.0,1.0,0.38,0.283,0.482
210
- Chronos-Bolt,TiRex-2,0.0,0.0,0.0,-0.184,-0.312,-0.088
211
- Chronos-Bolt,Toto-2.0-1B,0.083,0.0,0.25,-0.118,-0.219,-0.032
212
- Chronos-Bolt,Toto-2.0-2.5B,0.167,0.0,0.417,-0.127,-0.224,-0.051
213
- Chronos-Bolt,Toto-2.0-313m,0.167,0.0,0.417,-0.113,-0.192,-0.051
214
- Chronos-Bolt,TiRex,0.083,0.0,0.25,-0.113,-0.2,-0.049
215
- Chronos-Bolt,Toto-2.0-22m,0.083,0.0,0.25,-0.118,-0.172,-0.068
216
- Chronos-Bolt,Chronos-2,0.333,0.083,0.583,-0.092,-0.2,-0.014
217
- Chronos-Bolt,FlowState,0.417,0.167,0.668,-0.091,-0.23,0.021
218
- Chronos-Bolt,Toto-1.0,0.167,0.0,0.333,-0.041,-0.083,-0.003
219
- Chronos-Bolt,TabPFN-TS,0.417,0.167,0.669,-0.078,-0.208,0.042
220
- Chronos-Bolt,TimesFM-2.5,0.417,0.167,0.667,-0.061,-0.167,0.014
221
- Chronos-Bolt,Toto-2.0-4m,0.25,0.0,0.5,-0.046,-0.101,-0.007
222
- Chronos-Bolt,Stat. Ensemble,0.583,0.333,0.833,-0.04,-0.184,0.077
223
- Chronos-Bolt,Chronos-Bolt,0.5,0.5,0.5,0.0,0.0,0.0
224
- Chronos-Bolt,AutoETS,0.583,0.333,0.833,-0.019,-0.125,0.057
225
- Chronos-Bolt,Seasonal Naive,0.833,0.583,1.0,0.355,0.212,0.48
226
- AutoETS,TiRex-2,0.083,0.0,0.25,-0.161,-0.26,-0.087
227
- AutoETS,Toto-2.0-1B,0.25,0.0,0.5,-0.097,-0.192,0.019
228
- AutoETS,Toto-2.0-2.5B,0.25,0.0,0.5,-0.106,-0.186,-0.016
229
- AutoETS,Toto-2.0-313m,0.25,0.0,0.5,-0.092,-0.165,-0.01
230
- AutoETS,TiRex,0.167,0.0,0.417,-0.092,-0.169,-0.018
231
- AutoETS,Toto-2.0-22m,0.083,0.0,0.25,-0.096,-0.149,-0.02
232
- AutoETS,Chronos-2,0.083,0.0,0.25,-0.071,-0.126,-0.004
233
- AutoETS,FlowState,0.333,0.083,0.583,-0.07,-0.17,0.018
234
- AutoETS,Toto-1.0,0.333,0.083,0.583,-0.022,-0.104,0.067
235
- AutoETS,TabPFN-TS,0.25,0.0,0.5,-0.057,-0.126,0.021
236
- AutoETS,TimesFM-2.5,0.25,0.0,0.5,-0.041,-0.116,0.043
237
- AutoETS,Toto-2.0-4m,0.25,0.0,0.5,-0.026,-0.088,0.063
238
- AutoETS,Stat. Ensemble,0.583,0.333,0.833,-0.02,-0.105,0.064
239
- AutoETS,Chronos-Bolt,0.417,0.167,0.667,0.019,-0.06,0.111
240
- AutoETS,AutoETS,0.5,0.5,0.5,0.0,0.0,0.0
241
- AutoETS,Seasonal Naive,0.917,0.75,1.0,0.368,0.243,0.486
242
- Seasonal Naive,TiRex-2,0.0,0.0,0.0,-0.836,-1.325,-0.508
243
- Seasonal Naive,Toto-2.0-1B,0.083,0.0,0.25,-0.735,-1.226,-0.367
244
- Seasonal Naive,Toto-2.0-2.5B,0.083,0.0,0.25,-0.748,-1.202,-0.414
245
- Seasonal Naive,Toto-2.0-313m,0.083,0.0,0.25,-0.727,-1.169,-0.398
246
- Seasonal Naive,TiRex,0.0,0.0,0.0,-0.727,-1.204,-0.402
247
- Seasonal Naive,Toto-2.0-22m,0.083,0.0,0.25,-0.734,-1.169,-0.429
248
- Seasonal Naive,Chronos-2,0.083,0.0,0.25,-0.694,-1.116,-0.391
249
- Seasonal Naive,FlowState,0.083,0.0,0.25,-0.692,-1.082,-0.407
250
- Seasonal Naive,Toto-1.0,0.167,0.0,0.417,-0.616,-1.022,-0.311
251
- Seasonal Naive,TabPFN-TS,0.0,0.0,0.0,-0.672,-1.007,-0.432
252
- Seasonal Naive,TimesFM-2.5,0.083,0.0,0.25,-0.647,-1.071,-0.346
253
- Seasonal Naive,Toto-2.0-4m,0.083,0.0,0.25,-0.622,-1.024,-0.323
254
- Seasonal Naive,Stat. Ensemble,0.0,0.0,0.0,-0.613,-0.931,-0.394
255
- Seasonal Naive,Chronos-Bolt,0.167,0.0,0.417,-0.551,-0.924,-0.269
256
- Seasonal Naive,AutoETS,0.083,0.0,0.25,-0.581,-0.947,-0.321
257
- Seasonal Naive,Seasonal Naive,0.5,0.5,0.5,0.0,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_energy/leaderboard_MASE.csv DELETED
@@ -1,29 +0,0 @@
1
- model_name,win_rate,skill_score,median_training_time_s_per100,median_inference_time_s_per100,training_corpus_overlap,num_failures
2
- Chronos-2,84.75783475783474,35.398351985937104,0.0,3.4120501715909093,0.0,0.0
3
- Toto-2.0-1B,77.35042735042735,27.64063711794009,0.0,3.1623076374715904,0.0,0.0
4
- Toto-2.0-2.5B,77.20797720797721,27.403361161284135,0.0,6.4650776003125,0.0,0.0
5
- TabPFN-TS-3,75.92592592592594,34.00489490838103,0.0,822.0435218492969,0.0,0.0
6
- TiRex-2,75.7834757834758,32.34547171146631,0.0,1.0366915774648078,0.0,0.0
7
- Toto-2.0-313m,74.92877492877491,27.247610226794162,0.0,1.5456846913541669,0.0,0.0
8
- TiRex,66.52421652421651,25.111125954829205,0.0,1.3324642875,0.038461538461538464,0.0
9
- TabPFN-TS,64.52991452991454,29.948417313219487,0.0,308.48925294219475,0.0,0.0
10
- TimesFM-2.5,63.817663817663814,24.470577229456005,0.0,35.73234459616477,0.15384615384615385,0.0
11
- Toto-2.0-22m,63.10541310541311,25.222517255488896,0.0,0.7798815821022727,0.0,0.0
12
- Chronos-Bolt,60.25641025641026,24.79493112223894,0.0,1.1602838375000002,0.0,0.0
13
- FlowState,58.974358974358964,24.74097538777954,0.0,3.7859752799626865,0.15384615384615385,0.0
14
- Moirai-2.0,57.692307692307686,23.276855703905884,0.0,2.549116965535714,0.3076923076923077,0.0
15
- Sundial-Base,54.98575498575499,25.973733886600225,0.0,8.734264116875,0.038461538461538464,0.0
16
- Toto-1.0,54.98575498575499,22.17352687153604,0.0,64.32606581959577,0.15384615384615385,0.0
17
- Toto-2.0-4m,54.7008547008547,21.834602126597346,0.0,0.7024468823376624,0.0,0.0
18
- TFT,47.86324786324787,24.332626654075018,7067.210990843215,5.868696277689394,0.0,0.0
19
- DeepAR,42.52136752136752,20.515410969632153,13498.838423148572,8.687442574285715,0.0,11.538461538461538
20
- PatchTST,39.743589743589745,18.853426287300014,7221.856288165601,6.349855852499999,0.0,0.0
21
- CatBoost,39.60113960113959,17.15191259995018,498.1807509,5.586804820681818,0.0,0.0
22
- LightGBM,36.75213675213675,14.854815383201469,47.29828941238095,4.303395228143939,0.0,0.0
23
- Stat. Ensemble,27.27920227920228,4.447406228151163,0.0,2051.548594149911,0.0,7.6923076923076925
24
- AutoARIMA,26.139601139601137,2.212327431466543,0.0,1885.5145473599553,0.0,7.6923076923076925
25
- Seasonal Naive,21.652421652421648,0.0,0.0,1.042975715,0.0,0.0
26
- AutoTheta,20.085470085470085,1.1815956958414753,0.0,6.6345268946875,0.0,0.0
27
- AutoETS,15.242165242165239,-34.97549884253801,0.0,13.387819541051137,0.0,0.0
28
- Naive,12.606837606837603,-44.773921203129,0.0,1.0805920684374999,0.0,0.0
29
- Drift,4.985754985754986,-52.29912347479908,0.0,1.081847729375,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_energy/leaderboard_SQL.csv DELETED
@@ -1,29 +0,0 @@
1
- model_name,win_rate,skill_score,median_training_time_s_per100,median_inference_time_s_per100,training_corpus_overlap,num_failures
2
- Chronos-2,85.6125356125356,43.696037899366445,0.0,3.4120501715909093,0.0,0.0
3
- Toto-2.0-1B,81.05413105413105,37.19233498724061,0.0,3.1623076374715904,0.0,0.0
4
- TiRex-2,80.34188034188034,40.955040522328076,0.0,1.0366915774648078,0.0,0.0
5
- Toto-2.0-2.5B,80.34188034188034,36.942973998246586,0.0,6.4650776003125,0.0,0.0
6
- TabPFN-TS-3,77.92022792022793,42.12648526492014,0.0,822.0435218492969,0.0,0.0
7
- Toto-2.0-313m,77.4928774928775,36.69282240000613,0.0,1.5456846913541669,0.0,0.0
8
- TiRex,70.94017094017097,34.44791484004565,0.0,1.3324642875,0.038461538461538464,0.0
9
- Toto-2.0-22m,68.23361823361823,34.72199927167168,0.0,0.7798815821022727,0.0,0.0
10
- TabPFN-TS,68.0911680911681,38.63838178079146,0.0,308.48925294219475,0.0,0.0
11
- TimesFM-2.5,64.81481481481481,33.040194549839576,0.0,35.73234459616477,0.15384615384615385,0.0
12
- FlowState,60.25641025641024,32.4100685185642,0.0,3.7859752799626865,0.15384615384615385,0.0
13
- Chronos-Bolt,58.974358974358985,32.881689430291104,0.0,1.1602838375000002,0.0,0.0
14
- Moirai-2.0,57.83475783475783,31.52282472603488,0.0,2.549116965535714,0.3076923076923077,0.0
15
- Toto-2.0-4m,57.12250712250713,31.473352334477845,0.0,0.7024468823376624,0.0,0.0
16
- Toto-1.0,56.41025641025641,31.112045696230428,0.0,64.32606581959577,0.15384615384615385,0.0
17
- TFT,52.70655270655271,32.085719324643314,7067.210990843215,5.868696277689394,0.0,0.0
18
- Sundial-Base,45.15669515669515,28.52842311909273,0.0,8.734264116875,0.038461538461538464,0.0
19
- DeepAR,43.94586894586894,26.66949092254881,13498.838423148572,8.687442574285715,0.0,11.538461538461538
20
- PatchTST,43.01994301994302,25.60679591439182,7221.856288165601,6.349855852499999,0.0,0.0
21
- AutoARIMA,29.700854700854695,9.139931178596383,0.0,1885.5145473599553,0.0,7.6923076923076925
22
- Stat. Ensemble,27.136752136752136,6.196332966589502,0.0,2051.548594149911,0.0,7.6923076923076925
23
- CatBoost,25.64102564102563,8.874064288365757,498.1807509,5.586804820681818,0.0,0.0
24
- LightGBM,22.649572649572647,6.34745033907752,47.29828941238095,4.303395228143939,0.0,0.0
25
- Seasonal Naive,19.08831908831909,0.0,0.0,1.042975715,0.0,0.0
26
- AutoETS,17.66381766381766,-30.210229740669558,0.0,13.387819541051137,0.0,0.0
27
- AutoTheta,15.811965811965809,-10.643501874241924,0.0,6.6345268946875,0.0,0.0
28
- Naive,8.903133903133902,-60.57154490567112,0.0,1.0805920684374999,0.0,0.0
29
- Drift,3.133903133903134,-67.3016518958006,0.0,1.081847729375,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_energy/leaderboard_WAPE.csv DELETED
@@ -1,29 +0,0 @@
1
- model_name,win_rate,skill_score,median_training_time_s_per100,median_inference_time_s_per100,training_corpus_overlap,num_failures
2
- Chronos-2,82.62108262108262,37.557901536977845,0.0,3.4120501715909093,0.0,0.0
3
- Toto-2.0-1B,76.06837606837607,31.032868019309202,0.0,3.1623076374715904,0.0,0.0
4
- Toto-2.0-313m,75.64102564102564,30.705322754813878,0.0,1.5456846913541669,0.0,0.0
5
- Toto-2.0-2.5B,73.78917378917377,30.308651726585033,0.0,6.4650776003125,0.0,0.0
6
- TiRex-2,71.36752136752136,34.43124058342566,0.0,1.0366915774648078,0.0,0.0
7
- TabPFN-TS-3,70.7977207977208,34.61666637481101,0.0,822.0435218492969,0.0,0.0
8
- Toto-2.0-22m,65.24216524216523,28.863859566477203,0.0,0.7798815821022727,0.0,0.0
9
- TiRex,62.25071225071225,27.322662354204475,0.0,1.3324642875,0.038461538461538464,0.0
10
- TimesFM-2.5,60.68376068376068,26.65794953458317,0.0,35.73234459616477,0.15384615384615385,0.0
11
- TabPFN-TS,60.541310541310544,30.36322876478197,0.0,308.48925294219475,0.0,0.0
12
- Chronos-Bolt,57.122507122507116,26.606852502371968,0.0,1.1602838375000002,0.0,0.0
13
- Moirai-2.0,56.837606837606835,25.99988075597758,0.0,2.549116965535714,0.3076923076923077,0.0
14
- FlowState,53.84615384615385,26.89142712985859,0.0,3.7859752799626865,0.15384615384615385,0.0
15
- Sundial-Base,53.13390313390314,28.265544600882,0.0,8.734264116875,0.038461538461538464,0.0
16
- Toto-1.0,51.85185185185185,24.207524581618266,0.0,64.32606581959577,0.15384615384615385,0.0
17
- TFT,50.142450142450144,26.59412613673687,7067.210990843215,5.868696277689394,0.0,0.0
18
- Toto-2.0-4m,49.43019943019942,23.82250300845572,0.0,0.7024468823376624,0.0,0.0
19
- PatchTST,43.73219373219374,20.65325504182872,7221.856288165601,6.349855852499999,0.0,0.0
20
- DeepAR,41.95156695156697,21.82047445619971,13498.838423148572,8.687442574285715,0.0,11.538461538461538
21
- LightGBM,41.3105413105413,20.63835609604817,47.29828941238095,4.303395228143939,0.0,0.0
22
- CatBoost,40.028490028490026,20.174610152005823,498.1807509,5.586804820681818,0.0,0.0
23
- Stat. Ensemble,33.97435897435897,8.430993583997726,0.0,2051.548594149911,0.0,7.6923076923076925
24
- AutoARIMA,25.28490028490028,3.8316800542679386,0.0,1885.5145473599553,0.0,7.6923076923076925
25
- AutoETS,22.93447293447294,-24.06197476117884,0.0,13.387819541051137,0.0,0.0
26
- Naive,22.578347578347575,-29.595393529303713,0.0,1.0805920684374999,0.0,0.0
27
- AutoTheta,22.222222222222218,4.200265666572001,0.0,6.6345268946875,0.0,0.0
28
- Seasonal Naive,20.08547008547008,0.0,0.0,1.042975715,0.0,0.0
29
- Drift,14.529914529914533,-36.91555319026642,0.0,1.081847729375,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_energy/leaderboard_WQL.csv DELETED
@@ -1,29 +0,0 @@
1
- model_name,win_rate,skill_score,median_training_time_s_per100,median_inference_time_s_per100,training_corpus_overlap,num_failures
2
- Chronos-2,85.32763532763533,45.99295404026385,0.0,3.4120501715909093,0.0,0.0
3
- Toto-2.0-1B,82.6210826210826,40.95974538328001,0.0,3.1623076374715904,0.0,0.0
4
- Toto-2.0-2.5B,80.19943019943021,40.25120913531922,0.0,6.4650776003125,0.0,0.0
5
- Toto-2.0-313m,80.1994301994302,40.431908864449696,0.0,1.5456846913541669,0.0,0.0
6
- TiRex-2,78.20512820512819,43.430525812131435,0.0,1.0366915774648078,0.0,0.0
7
- TabPFN-TS-3,74.92877492877494,43.103980194426214,0.0,822.0435218492969,0.0,0.0
8
- Toto-2.0-22m,70.37037037037037,38.501099243397576,0.0,0.7798815821022727,0.0,0.0
9
- TiRex,68.66096866096866,37.015923795326046,0.0,1.3324642875,0.038461538461538464,0.0
10
- TabPFN-TS,66.66666666666669,39.634990899313024,0.0,308.48925294219475,0.0,0.0
11
- TimesFM-2.5,62.96296296296296,35.74711028493935,0.0,35.73234459616477,0.15384615384615385,0.0
12
- FlowState,58.68945868945868,35.238708603025636,0.0,3.7859752799626865,0.15384615384615385,0.0
13
- Chronos-Bolt,58.4045584045584,35.346534587472554,0.0,1.1602838375000002,0.0,0.0
14
- Moirai-2.0,57.692307692307686,34.54029716114274,0.0,2.549116965535714,0.3076923076923077,0.0
15
- Toto-2.0-4m,55.55555555555555,33.916952411684484,0.0,0.7024468823376624,0.0,0.0
16
- Toto-1.0,54.84330484330483,33.68160197994784,0.0,64.32606581959577,0.15384615384615385,0.0
17
- TFT,53.27635327635329,34.858358688960024,7067.210990843215,5.868696277689394,0.0,0.0
18
- Sundial-Base,45.29914529914529,31.420585268607393,0.0,8.734264116875,0.038461538461538464,0.0
19
- PatchTST,44.58689458689459,28.17762114987711,7221.856288165601,6.349855852499999,0.0,0.0
20
- DeepAR,42.8062678062678,28.82551876839535,13498.838423148572,8.687442574285715,0.0,11.538461538461538
21
- LightGBM,30.484330484330478,13.804281918946282,47.29828941238095,4.303395228143939,0.0,0.0
22
- Stat. Ensemble,29.558404558404554,11.001763956139254,0.0,2051.548594149911,0.0,7.6923076923076925
23
- AutoARIMA,28.133903133903132,10.956865003323434,0.0,1885.5145473599553,0.0,7.6923076923076925
24
- CatBoost,26.638176638176635,13.30060154143199,498.1807509,5.586804820681818,0.0,0.0
25
- Seasonal Naive,16.80911680911681,0.0,0.0,1.042975715,0.0,0.0
26
- AutoETS,16.666666666666664,-24.269495322854407,0.0,13.387819541051137,0.0,0.0
27
- AutoTheta,16.23931623931624,-4.896832310667398,0.0,6.6345268946875,0.0,0.0
28
- Naive,9.615384615384617,-50.976730476610335,0.0,1.0805920684374999,0.0,0.0
29
- Drift,4.5584045584045585,-57.44553171159505,0.0,1.081847729375,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_energy/pairwise_MASE.csv DELETED
@@ -1,257 +0,0 @@
1
- model_1,model_2,win_rate,win_rate_lower,win_rate_upper,skill_score,skill_score_lower,skill_score_upper
2
- Chronos-2,Chronos-2,0.5,0.5,0.5,0.0,0.0,0.0
3
- Chronos-2,Toto-2.0-2.5B,0.654,0.462,0.808,0.11,0.043,0.177
4
- Chronos-2,Toto-2.0-1B,0.577,0.385,0.769,0.107,0.04,0.174
5
- Chronos-2,Toto-2.0-313m,0.654,0.462,0.846,0.112,0.04,0.182
6
- Chronos-2,TiRex-2,0.577,0.385,0.769,0.045,0.001,0.092
7
- Chronos-2,TabPFN-TS-3,0.654,0.462,0.846,0.021,-0.014,0.058
8
- Chronos-2,TiRex,0.769,0.615,0.923,0.137,0.066,0.203
9
- Chronos-2,TabPFN-TS,0.769,0.615,0.923,0.078,0.038,0.118
10
- Chronos-2,TimesFM-2.5,0.769,0.577,0.923,0.145,0.072,0.212
11
- Chronos-2,Toto-2.0-22m,0.885,0.769,1.0,0.136,0.072,0.201
12
- Chronos-2,FlowState,0.846,0.692,0.962,0.142,0.073,0.202
13
- Chronos-2,Chronos-Bolt,0.962,0.885,1.0,0.141,0.078,0.202
14
- Chronos-2,Moirai-2.0,0.923,0.808,1.0,0.158,0.092,0.222
15
- Chronos-2,Toto-1.0,0.846,0.692,0.962,0.17,0.105,0.237
16
- Chronos-2,Sundial-Base,0.846,0.692,0.962,0.127,0.069,0.195
17
- Chronos-2,Seasonal Naive,0.962,0.885,1.0,0.354,0.278,0.422
18
- Toto-2.0-2.5B,Chronos-2,0.346,0.192,0.538,-0.124,-0.214,-0.045
19
- Toto-2.0-2.5B,Toto-2.0-2.5B,0.5,0.5,0.5,0.0,0.0,0.0
20
- Toto-2.0-2.5B,Toto-2.0-1B,0.5,0.346,0.692,-0.003,-0.011,0.004
21
- Toto-2.0-2.5B,Toto-2.0-313m,0.615,0.423,0.808,0.002,-0.013,0.016
22
- Toto-2.0-2.5B,TiRex-2,0.5,0.308,0.692,-0.073,-0.162,-0.001
23
- Toto-2.0-2.5B,TabPFN-TS-3,0.462,0.269,0.654,-0.1,-0.208,-0.003
24
- Toto-2.0-2.5B,TiRex,0.692,0.5,0.846,0.031,0.007,0.055
25
- Toto-2.0-2.5B,TabPFN-TS,0.654,0.462,0.846,-0.036,-0.133,0.042
26
- Toto-2.0-2.5B,TimesFM-2.5,0.692,0.5,0.846,0.039,0.01,0.071
27
- Toto-2.0-2.5B,Toto-2.0-22m,0.808,0.654,0.962,0.029,0.016,0.042
28
- Toto-2.0-2.5B,FlowState,0.808,0.654,0.923,0.035,-0.0,0.067
29
- Toto-2.0-2.5B,Chronos-Bolt,0.846,0.692,0.962,0.035,0.005,0.062
30
- Toto-2.0-2.5B,Moirai-2.0,0.846,0.692,0.962,0.054,0.028,0.083
31
- Toto-2.0-2.5B,Toto-1.0,0.808,0.654,0.962,0.067,0.04,0.101
32
- Toto-2.0-2.5B,Sundial-Base,0.769,0.615,0.923,0.019,-0.071,0.108
33
- Toto-2.0-2.5B,Seasonal Naive,0.962,0.885,1.0,0.274,0.211,0.335
34
- Toto-2.0-1B,Chronos-2,0.423,0.231,0.615,-0.12,-0.211,-0.042
35
- Toto-2.0-1B,Toto-2.0-2.5B,0.5,0.308,0.654,0.003,-0.004,0.011
36
- Toto-2.0-1B,Toto-2.0-1B,0.5,0.5,0.5,0.0,0.0,0.0
37
- Toto-2.0-1B,Toto-2.0-313m,0.5,0.308,0.692,0.005,-0.008,0.019
38
- Toto-2.0-1B,TiRex-2,0.615,0.423,0.808,-0.07,-0.162,0.004
39
- Toto-2.0-1B,TabPFN-TS-3,0.423,0.231,0.615,-0.096,-0.205,0.001
40
- Toto-2.0-1B,TiRex,0.654,0.462,0.808,0.034,0.011,0.059
41
- Toto-2.0-1B,TabPFN-TS,0.615,0.423,0.808,-0.033,-0.13,0.048
42
- Toto-2.0-1B,TimesFM-2.5,0.769,0.577,0.923,0.042,0.012,0.074
43
- Toto-2.0-1B,Toto-2.0-22m,0.846,0.692,0.962,0.032,0.02,0.046
44
- Toto-2.0-1B,FlowState,0.769,0.615,0.923,0.039,0.004,0.069
45
- Toto-2.0-1B,Chronos-Bolt,0.846,0.692,0.962,0.038,0.007,0.066
46
- Toto-2.0-1B,Moirai-2.0,0.846,0.692,0.962,0.057,0.034,0.083
47
- Toto-2.0-1B,Toto-1.0,0.808,0.654,0.923,0.07,0.043,0.102
48
- Toto-2.0-1B,Sundial-Base,0.731,0.577,0.885,0.023,-0.068,0.11
49
- Toto-2.0-1B,Seasonal Naive,0.923,0.808,1.0,0.276,0.21,0.34
50
- Toto-2.0-313m,Chronos-2,0.346,0.154,0.538,-0.126,-0.222,-0.042
51
- Toto-2.0-313m,Toto-2.0-2.5B,0.385,0.192,0.577,-0.002,-0.016,0.013
52
- Toto-2.0-313m,Toto-2.0-1B,0.5,0.308,0.692,-0.005,-0.019,0.008
53
- Toto-2.0-313m,Toto-2.0-313m,0.5,0.5,0.5,0.0,0.0,0.0
54
- Toto-2.0-313m,TiRex-2,0.5,0.308,0.692,-0.075,-0.172,0.001
55
- Toto-2.0-313m,TabPFN-TS-3,0.462,0.269,0.654,-0.102,-0.213,-0.002
56
- Toto-2.0-313m,TiRex,0.615,0.423,0.808,0.029,0.011,0.048
57
- Toto-2.0-313m,TabPFN-TS,0.654,0.462,0.846,-0.039,-0.142,0.043
58
- Toto-2.0-313m,TimesFM-2.5,0.692,0.5,0.847,0.037,0.012,0.062
59
- Toto-2.0-313m,Toto-2.0-22m,0.731,0.538,0.885,0.027,0.014,0.041
60
- Toto-2.0-313m,FlowState,0.769,0.615,0.923,0.033,0.002,0.062
61
- Toto-2.0-313m,Chronos-Bolt,0.731,0.576,0.885,0.033,0.004,0.06
62
- Toto-2.0-313m,Moirai-2.0,0.769,0.577,0.923,0.052,0.025,0.08
63
- Toto-2.0-313m,Toto-1.0,0.731,0.538,0.885,0.065,0.037,0.096
64
- Toto-2.0-313m,Sundial-Base,0.808,0.654,0.962,0.017,-0.072,0.099
65
- Toto-2.0-313m,Seasonal Naive,0.923,0.808,1.0,0.272,0.206,0.336
66
- TiRex-2,Chronos-2,0.423,0.231,0.615,-0.047,-0.101,-0.001
67
- TiRex-2,Toto-2.0-2.5B,0.5,0.308,0.692,0.068,0.001,0.14
68
- TiRex-2,Toto-2.0-1B,0.385,0.192,0.577,0.065,-0.004,0.139
69
- TiRex-2,Toto-2.0-313m,0.5,0.308,0.692,0.07,-0.001,0.147
70
- TiRex-2,TiRex-2,0.5,0.5,0.5,0.0,0.0,0.0
71
- TiRex-2,TabPFN-TS-3,0.5,0.308,0.692,-0.025,-0.087,0.028
72
- TiRex-2,TiRex,0.769,0.615,0.923,0.097,0.031,0.165
73
- TiRex-2,TabPFN-TS,0.654,0.462,0.846,0.034,-0.02,0.085
74
- TiRex-2,TimesFM-2.5,0.654,0.462,0.808,0.104,0.032,0.177
75
- TiRex-2,Toto-2.0-22m,0.577,0.385,0.769,0.095,0.029,0.163
76
- TiRex-2,FlowState,0.731,0.577,0.885,0.101,0.03,0.169
77
- TiRex-2,Chronos-Bolt,0.654,0.462,0.846,0.1,0.031,0.175
78
- TiRex-2,Moirai-2.0,0.692,0.538,0.846,0.118,0.055,0.181
79
- TiRex-2,Toto-1.0,0.692,0.538,0.846,0.131,0.065,0.2
80
- TiRex-2,Sundial-Base,0.808,0.654,0.962,0.086,0.006,0.164
81
- TiRex-2,Seasonal Naive,0.962,0.885,1.0,0.323,0.243,0.395
82
- TabPFN-TS-3,Chronos-2,0.346,0.154,0.538,-0.022,-0.062,0.013
83
- TabPFN-TS-3,Toto-2.0-2.5B,0.538,0.346,0.731,0.091,0.003,0.172
84
- TabPFN-TS-3,Toto-2.0-1B,0.577,0.385,0.769,0.088,-0.001,0.17
85
- TabPFN-TS-3,Toto-2.0-313m,0.538,0.346,0.731,0.093,0.002,0.175
86
- TabPFN-TS-3,TiRex-2,0.5,0.308,0.692,0.025,-0.029,0.08
87
- TabPFN-TS-3,TabPFN-TS-3,0.5,0.5,0.5,0.0,0.0,0.0
88
- TabPFN-TS-3,TiRex,0.538,0.346,0.731,0.119,0.032,0.197
89
- TabPFN-TS-3,TabPFN-TS,0.731,0.577,0.885,0.058,0.011,0.101
90
- TabPFN-TS-3,TimesFM-2.5,0.692,0.5,0.846,0.126,0.038,0.206
91
- TabPFN-TS-3,Toto-2.0-22m,0.615,0.423,0.77,0.117,0.034,0.194
92
- TabPFN-TS-3,FlowState,0.692,0.5,0.846,0.123,0.036,0.198
93
- TabPFN-TS-3,Chronos-Bolt,0.654,0.462,0.809,0.122,0.043,0.198
94
- TabPFN-TS-3,Moirai-2.0,0.654,0.462,0.808,0.14,0.054,0.22
95
- TabPFN-TS-3,Toto-1.0,0.692,0.5,0.846,0.152,0.072,0.227
96
- TabPFN-TS-3,Sundial-Base,0.769,0.615,0.923,0.108,0.038,0.185
97
- TabPFN-TS-3,Seasonal Naive,0.962,0.885,1.0,0.34,0.265,0.41
98
- TiRex,Chronos-2,0.231,0.077,0.385,-0.159,-0.255,-0.07
99
- TiRex,Toto-2.0-2.5B,0.308,0.154,0.5,-0.032,-0.059,-0.007
100
- TiRex,Toto-2.0-1B,0.346,0.192,0.538,-0.035,-0.063,-0.011
101
- TiRex,Toto-2.0-313m,0.385,0.192,0.577,-0.029,-0.051,-0.011
102
- TiRex,TiRex-2,0.231,0.077,0.385,-0.107,-0.198,-0.032
103
- TiRex,TabPFN-TS-3,0.462,0.269,0.654,-0.135,-0.246,-0.034
104
- TiRex,TiRex,0.5,0.5,0.5,0.0,0.0,0.0
105
- TiRex,TabPFN-TS,0.5,0.308,0.692,-0.069,-0.171,0.013
106
- TiRex,TimesFM-2.5,0.519,0.327,0.731,0.008,-0.015,0.033
107
- TiRex,Toto-2.0-22m,0.577,0.385,0.769,-0.001,-0.024,0.017
108
- TiRex,FlowState,0.481,0.308,0.654,0.005,-0.022,0.033
109
- TiRex,Chronos-Bolt,0.558,0.385,0.731,0.004,-0.021,0.032
110
- TiRex,Moirai-2.0,0.558,0.365,0.731,0.024,-0.003,0.056
111
- TiRex,Toto-1.0,0.673,0.5,0.846,0.038,0.011,0.068
112
- TiRex,Sundial-Base,0.75,0.596,0.904,-0.012,-0.103,0.066
113
- TiRex,Seasonal Naive,0.923,0.808,1.0,0.251,0.191,0.308
114
- TabPFN-TS,Chronos-2,0.231,0.077,0.385,-0.084,-0.133,-0.039
115
- TabPFN-TS,Toto-2.0-2.5B,0.346,0.154,0.538,0.035,-0.043,0.117
116
- TabPFN-TS,Toto-2.0-1B,0.385,0.192,0.577,0.032,-0.05,0.115
117
- TabPFN-TS,Toto-2.0-313m,0.346,0.154,0.538,0.037,-0.045,0.124
118
- TabPFN-TS,TiRex-2,0.346,0.154,0.538,-0.035,-0.093,0.02
119
- TabPFN-TS,TabPFN-TS-3,0.269,0.115,0.423,-0.061,-0.112,-0.012
120
- TabPFN-TS,TiRex,0.5,0.308,0.692,0.065,-0.014,0.146
121
- TabPFN-TS,TabPFN-TS,0.5,0.5,0.5,0.0,0.0,0.0
122
- TabPFN-TS,TimesFM-2.5,0.5,0.308,0.692,0.073,-0.003,0.152
123
- TabPFN-TS,Toto-2.0-22m,0.5,0.308,0.692,0.063,-0.016,0.142
124
- TabPFN-TS,FlowState,0.654,0.462,0.846,0.069,-0.011,0.143
125
- TabPFN-TS,Chronos-Bolt,0.538,0.346,0.731,0.069,0.002,0.143
126
- TabPFN-TS,Moirai-2.0,0.5,0.308,0.692,0.087,0.008,0.169
127
- TabPFN-TS,Toto-1.0,0.577,0.385,0.769,0.1,0.022,0.181
128
- TabPFN-TS,Sundial-Base,0.5,0.308,0.692,0.054,-0.036,0.143
129
- TabPFN-TS,Seasonal Naive,0.923,0.808,1.0,0.299,0.216,0.373
130
- TimesFM-2.5,Chronos-2,0.231,0.077,0.423,-0.169,-0.269,-0.077
131
- TimesFM-2.5,Toto-2.0-2.5B,0.308,0.154,0.5,-0.04,-0.076,-0.01
132
- TimesFM-2.5,Toto-2.0-1B,0.231,0.077,0.423,-0.044,-0.08,-0.012
133
- TimesFM-2.5,Toto-2.0-313m,0.308,0.153,0.5,-0.038,-0.066,-0.012
134
- TimesFM-2.5,TiRex-2,0.346,0.192,0.538,-0.116,-0.214,-0.033
135
- TimesFM-2.5,TabPFN-TS-3,0.308,0.154,0.5,-0.144,-0.259,-0.04
136
- TimesFM-2.5,TiRex,0.481,0.269,0.673,-0.009,-0.034,0.014
137
- TimesFM-2.5,TabPFN-TS,0.5,0.308,0.692,-0.078,-0.179,0.003
138
- TimesFM-2.5,TimesFM-2.5,0.5,0.5,0.5,0.0,0.0,0.0
139
- TimesFM-2.5,Toto-2.0-22m,0.462,0.269,0.654,-0.01,-0.044,0.02
140
- TimesFM-2.5,FlowState,0.538,0.365,0.712,-0.004,-0.035,0.027
141
- TimesFM-2.5,Chronos-Bolt,0.577,0.404,0.769,-0.004,-0.033,0.024
142
- TimesFM-2.5,Moirai-2.0,0.615,0.442,0.808,0.016,-0.028,0.057
143
- TimesFM-2.5,Toto-1.0,0.692,0.519,0.846,0.03,-0.006,0.071
144
- TimesFM-2.5,Sundial-Base,0.596,0.423,0.788,-0.02,-0.113,0.062
145
- TimesFM-2.5,Seasonal Naive,0.923,0.808,1.0,0.245,0.182,0.306
146
- Toto-2.0-22m,Chronos-2,0.115,0.0,0.231,-0.158,-0.252,-0.077
147
- Toto-2.0-22m,Toto-2.0-2.5B,0.192,0.038,0.346,-0.03,-0.044,-0.016
148
- Toto-2.0-22m,Toto-2.0-1B,0.154,0.038,0.308,-0.033,-0.048,-0.021
149
- Toto-2.0-22m,Toto-2.0-313m,0.269,0.115,0.462,-0.028,-0.043,-0.014
150
- Toto-2.0-22m,TiRex-2,0.423,0.231,0.615,-0.105,-0.195,-0.029
151
- Toto-2.0-22m,TabPFN-TS-3,0.385,0.23,0.577,-0.133,-0.241,-0.035
152
- Toto-2.0-22m,TiRex,0.423,0.231,0.615,0.001,-0.018,0.024
153
- Toto-2.0-22m,TabPFN-TS,0.5,0.308,0.692,-0.067,-0.166,0.016
154
- Toto-2.0-22m,TimesFM-2.5,0.538,0.346,0.731,0.01,-0.02,0.042
155
- Toto-2.0-22m,Toto-2.0-22m,0.5,0.5,0.5,0.0,0.0,0.0
156
- Toto-2.0-22m,FlowState,0.423,0.268,0.615,0.006,-0.028,0.038
157
- Toto-2.0-22m,Chronos-Bolt,0.538,0.346,0.731,0.006,-0.025,0.036
158
- Toto-2.0-22m,Moirai-2.0,0.538,0.346,0.731,0.025,0.002,0.052
159
- Toto-2.0-22m,Toto-1.0,0.731,0.538,0.885,0.039,0.013,0.071
160
- Toto-2.0-22m,Sundial-Base,0.654,0.462,0.808,-0.01,-0.105,0.074
161
- Toto-2.0-22m,Seasonal Naive,0.885,0.731,1.0,0.252,0.188,0.315
162
- FlowState,Chronos-2,0.154,0.038,0.308,-0.165,-0.253,-0.079
163
- FlowState,Toto-2.0-2.5B,0.192,0.077,0.346,-0.037,-0.071,0.0
164
- FlowState,Toto-2.0-1B,0.231,0.077,0.385,-0.04,-0.074,-0.004
165
- FlowState,Toto-2.0-313m,0.231,0.077,0.385,-0.034,-0.066,-0.002
166
- FlowState,TiRex-2,0.269,0.115,0.423,-0.112,-0.204,-0.031
167
- FlowState,TabPFN-TS-3,0.308,0.154,0.5,-0.14,-0.246,-0.037
168
- FlowState,TiRex,0.519,0.346,0.692,-0.005,-0.034,0.022
169
- FlowState,TabPFN-TS,0.346,0.154,0.538,-0.074,-0.167,0.011
170
- FlowState,TimesFM-2.5,0.462,0.288,0.635,0.004,-0.027,0.034
171
- FlowState,Toto-2.0-22m,0.577,0.385,0.732,-0.006,-0.039,0.027
172
- FlowState,FlowState,0.5,0.5,0.5,0.0,0.0,0.0
173
- FlowState,Chronos-Bolt,0.538,0.365,0.712,-0.001,-0.029,0.034
174
- FlowState,Moirai-2.0,0.462,0.307,0.635,0.019,-0.019,0.062
175
- FlowState,Toto-1.0,0.577,0.404,0.75,0.033,-0.002,0.073
176
- FlowState,Sundial-Base,0.596,0.423,0.788,-0.017,-0.106,0.06
177
- FlowState,Seasonal Naive,0.846,0.692,0.962,0.247,0.177,0.309
178
- Chronos-Bolt,Chronos-2,0.038,0.0,0.115,-0.164,-0.254,-0.085
179
- Chronos-Bolt,Toto-2.0-2.5B,0.154,0.038,0.308,-0.036,-0.066,-0.005
180
- Chronos-Bolt,Toto-2.0-1B,0.154,0.038,0.308,-0.039,-0.071,-0.007
181
- Chronos-Bolt,Toto-2.0-313m,0.269,0.115,0.424,-0.034,-0.064,-0.004
182
- Chronos-Bolt,TiRex-2,0.346,0.154,0.538,-0.112,-0.213,-0.032
183
- Chronos-Bolt,TabPFN-TS-3,0.346,0.191,0.538,-0.14,-0.248,-0.045
184
- Chronos-Bolt,TiRex,0.442,0.269,0.615,-0.004,-0.034,0.02
185
- Chronos-Bolt,TabPFN-TS,0.462,0.269,0.654,-0.074,-0.167,-0.002
186
- Chronos-Bolt,TimesFM-2.5,0.423,0.231,0.596,0.004,-0.025,0.032
187
- Chronos-Bolt,Toto-2.0-22m,0.462,0.269,0.654,-0.006,-0.037,0.025
188
- Chronos-Bolt,FlowState,0.462,0.288,0.635,0.001,-0.035,0.028
189
- Chronos-Bolt,Chronos-Bolt,0.5,0.5,0.5,0.0,0.0,0.0
190
- Chronos-Bolt,Moirai-2.0,0.577,0.423,0.731,0.02,-0.022,0.064
191
- Chronos-Bolt,Toto-1.0,0.577,0.404,0.75,0.034,-0.001,0.072
192
- Chronos-Bolt,Sundial-Base,0.558,0.365,0.731,-0.016,-0.106,0.062
193
- Chronos-Bolt,Seasonal Naive,0.923,0.808,1.0,0.248,0.188,0.306
194
- Moirai-2.0,Chronos-2,0.077,0.0,0.192,-0.188,-0.285,-0.101
195
- Moirai-2.0,Toto-2.0-2.5B,0.154,0.038,0.308,-0.057,-0.091,-0.029
196
- Moirai-2.0,Toto-2.0-1B,0.154,0.038,0.308,-0.06,-0.091,-0.035
197
- Moirai-2.0,Toto-2.0-313m,0.231,0.077,0.423,-0.055,-0.087,-0.026
198
- Moirai-2.0,TiRex-2,0.308,0.154,0.462,-0.134,-0.221,-0.058
199
- Moirai-2.0,TabPFN-TS-3,0.346,0.192,0.538,-0.163,-0.282,-0.057
200
- Moirai-2.0,TiRex,0.442,0.269,0.635,-0.024,-0.059,0.003
201
- Moirai-2.0,TabPFN-TS,0.5,0.308,0.692,-0.095,-0.203,-0.008
202
- Moirai-2.0,TimesFM-2.5,0.385,0.192,0.558,-0.016,-0.061,0.027
203
- Moirai-2.0,Toto-2.0-22m,0.462,0.269,0.654,-0.026,-0.055,-0.002
204
- Moirai-2.0,FlowState,0.538,0.365,0.693,-0.019,-0.066,0.018
205
- Moirai-2.0,Chronos-Bolt,0.423,0.269,0.577,-0.02,-0.068,0.021
206
- Moirai-2.0,Moirai-2.0,0.5,0.5,0.5,0.0,0.0,0.0
207
- Moirai-2.0,Toto-1.0,0.615,0.462,0.788,0.014,-0.01,0.043
208
- Moirai-2.0,Sundial-Base,0.635,0.462,0.789,-0.036,-0.136,0.048
209
- Moirai-2.0,Seasonal Naive,0.808,0.654,0.924,0.233,0.167,0.293
210
- Toto-1.0,Chronos-2,0.154,0.038,0.308,-0.205,-0.31,-0.117
211
- Toto-1.0,Toto-2.0-2.5B,0.192,0.038,0.346,-0.072,-0.112,-0.041
212
- Toto-1.0,Toto-2.0-1B,0.192,0.077,0.346,-0.076,-0.114,-0.045
213
- Toto-1.0,Toto-2.0-313m,0.269,0.115,0.462,-0.07,-0.106,-0.039
214
- Toto-1.0,TiRex-2,0.308,0.154,0.462,-0.15,-0.25,-0.07
215
- Toto-1.0,TabPFN-TS-3,0.308,0.154,0.5,-0.179,-0.293,-0.078
216
- Toto-1.0,TiRex,0.327,0.154,0.5,-0.039,-0.073,-0.011
217
- Toto-1.0,TabPFN-TS,0.423,0.231,0.615,-0.111,-0.221,-0.022
218
- Toto-1.0,TimesFM-2.5,0.308,0.154,0.481,-0.03,-0.076,0.006
219
- Toto-1.0,Toto-2.0-22m,0.269,0.115,0.462,-0.041,-0.077,-0.014
220
- Toto-1.0,FlowState,0.423,0.25,0.596,-0.034,-0.078,0.002
221
- Toto-1.0,Chronos-Bolt,0.423,0.25,0.596,-0.035,-0.078,0.001
222
- Toto-1.0,Moirai-2.0,0.385,0.212,0.538,-0.014,-0.045,0.01
223
- Toto-1.0,Toto-1.0,0.5,0.5,0.5,0.0,0.0,0.0
224
- Toto-1.0,Sundial-Base,0.519,0.346,0.692,-0.051,-0.149,0.03
225
- Toto-1.0,Seasonal Naive,0.885,0.731,1.0,0.222,0.159,0.278
226
- Sundial-Base,Chronos-2,0.154,0.038,0.308,-0.146,-0.242,-0.074
227
- Sundial-Base,Toto-2.0-2.5B,0.231,0.077,0.385,-0.02,-0.121,0.066
228
- Sundial-Base,Toto-2.0-1B,0.269,0.115,0.423,-0.023,-0.124,0.063
229
- Sundial-Base,Toto-2.0-313m,0.192,0.038,0.346,-0.018,-0.11,0.067
230
- Sundial-Base,TiRex-2,0.192,0.038,0.346,-0.094,-0.196,-0.006
231
- Sundial-Base,TabPFN-TS-3,0.231,0.077,0.385,-0.122,-0.227,-0.04
232
- Sundial-Base,TiRex,0.25,0.096,0.404,0.012,-0.071,0.093
233
- Sundial-Base,TabPFN-TS,0.5,0.308,0.692,-0.057,-0.166,0.035
234
- Sundial-Base,TimesFM-2.5,0.404,0.212,0.577,0.02,-0.066,0.101
235
- Sundial-Base,Toto-2.0-22m,0.346,0.192,0.538,0.01,-0.08,0.095
236
- Sundial-Base,FlowState,0.404,0.212,0.577,0.016,-0.064,0.096
237
- Sundial-Base,Chronos-Bolt,0.442,0.269,0.635,0.016,-0.066,0.096
238
- Sundial-Base,Moirai-2.0,0.365,0.211,0.538,0.035,-0.051,0.119
239
- Sundial-Base,Toto-1.0,0.481,0.308,0.654,0.049,-0.031,0.129
240
- Sundial-Base,Sundial-Base,0.5,0.5,0.5,0.0,0.0,0.0
241
- Sundial-Base,Seasonal Naive,0.885,0.731,1.0,0.26,0.177,0.334
242
- Seasonal Naive,Chronos-2,0.038,0.0,0.115,-0.548,-0.729,-0.384
243
- Seasonal Naive,Toto-2.0-2.5B,0.038,0.0,0.115,-0.377,-0.504,-0.267
244
- Seasonal Naive,Toto-2.0-1B,0.077,0.0,0.192,-0.382,-0.514,-0.266
245
- Seasonal Naive,Toto-2.0-313m,0.077,0.0,0.192,-0.375,-0.505,-0.259
246
- Seasonal Naive,TiRex-2,0.038,0.0,0.115,-0.478,-0.652,-0.321
247
- Seasonal Naive,TabPFN-TS-3,0.038,0.0,0.115,-0.515,-0.695,-0.36
248
- Seasonal Naive,TiRex,0.077,0.0,0.192,-0.335,-0.445,-0.237
249
- Seasonal Naive,TabPFN-TS,0.077,0.0,0.192,-0.428,-0.596,-0.276
250
- Seasonal Naive,TimesFM-2.5,0.077,0.0,0.192,-0.324,-0.441,-0.223
251
- Seasonal Naive,Toto-2.0-22m,0.115,0.0,0.269,-0.337,-0.46,-0.231
252
- Seasonal Naive,FlowState,0.154,0.038,0.308,-0.329,-0.447,-0.215
253
- Seasonal Naive,Chronos-Bolt,0.077,0.0,0.192,-0.33,-0.44,-0.232
254
- Seasonal Naive,Moirai-2.0,0.192,0.076,0.346,-0.303,-0.415,-0.201
255
- Seasonal Naive,Toto-1.0,0.115,0.0,0.269,-0.285,-0.386,-0.189
256
- Seasonal Naive,Sundial-Base,0.115,0.0,0.269,-0.351,-0.501,-0.215
257
- Seasonal Naive,Seasonal Naive,0.5,0.5,0.5,0.0,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_energy/pairwise_SQL.csv DELETED
@@ -1,257 +0,0 @@
1
- model_1,model_2,win_rate,win_rate_lower,win_rate_upper,skill_score,skill_score_lower,skill_score_upper
2
- Chronos-2,Chronos-2,0.5,0.5,0.5,0.0,0.0,0.0
3
- Chronos-2,Toto-2.0-1B,0.615,0.423,0.808,0.104,0.037,0.17
4
- Chronos-2,Toto-2.0-2.5B,0.654,0.462,0.808,0.107,0.041,0.173
5
- Chronos-2,TiRex-2,0.462,0.269,0.654,0.046,0.003,0.094
6
- Chronos-2,Toto-2.0-313m,0.615,0.423,0.808,0.111,0.041,0.178
7
- Chronos-2,TabPFN-TS-3,0.654,0.462,0.846,0.027,-0.009,0.067
8
- Chronos-2,TiRex,0.731,0.538,0.885,0.141,0.072,0.204
9
- Chronos-2,Toto-2.0-22m,0.808,0.654,0.923,0.137,0.072,0.202
10
- Chronos-2,TabPFN-TS,0.808,0.654,0.923,0.082,0.044,0.12
11
- Chronos-2,TimesFM-2.5,0.769,0.577,0.923,0.159,0.083,0.225
12
- Chronos-2,FlowState,0.885,0.731,1.0,0.167,0.099,0.227
13
- Chronos-2,Moirai-2.0,0.923,0.808,1.0,0.178,0.111,0.242
14
- Chronos-2,Chronos-Bolt,0.923,0.808,1.0,0.161,0.096,0.219
15
- Chronos-2,Toto-1.0,0.846,0.692,0.962,0.183,0.115,0.249
16
- Chronos-2,Toto-2.0-4m,0.885,0.768,1.0,0.178,0.104,0.248
17
- Chronos-2,Seasonal Naive,1.0,1.0,1.0,0.437,0.368,0.497
18
- Toto-2.0-1B,Chronos-2,0.385,0.192,0.577,-0.116,-0.204,-0.038
19
- Toto-2.0-1B,Toto-2.0-1B,0.5,0.5,0.5,0.0,0.0,0.0
20
- Toto-2.0-1B,Toto-2.0-2.5B,0.538,0.346,0.692,0.004,-0.003,0.012
21
- Toto-2.0-1B,TiRex-2,0.5,0.308,0.692,-0.064,-0.157,0.009
22
- Toto-2.0-1B,Toto-2.0-313m,0.577,0.385,0.769,0.008,-0.003,0.02
23
- Toto-2.0-1B,TabPFN-TS-3,0.462,0.269,0.654,-0.085,-0.194,0.015
24
- Toto-2.0-1B,TiRex,0.692,0.5,0.846,0.042,0.016,0.07
25
- Toto-2.0-1B,Toto-2.0-22m,0.885,0.731,1.0,0.038,0.025,0.054
26
- Toto-2.0-1B,TabPFN-TS,0.654,0.462,0.846,-0.024,-0.12,0.056
27
- Toto-2.0-1B,TimesFM-2.5,0.808,0.654,0.962,0.062,0.029,0.096
28
- Toto-2.0-1B,FlowState,0.846,0.692,0.962,0.071,0.039,0.104
29
- Toto-2.0-1B,Moirai-2.0,0.846,0.692,0.962,0.083,0.055,0.111
30
- Toto-2.0-1B,Chronos-Bolt,0.846,0.692,0.962,0.064,0.029,0.097
31
- Toto-2.0-1B,Toto-1.0,0.923,0.808,1.0,0.088,0.059,0.12
32
- Toto-2.0-1B,Toto-2.0-4m,0.885,0.731,1.0,0.083,0.051,0.117
33
- Toto-2.0-1B,Seasonal Naive,1.0,1.0,1.0,0.372,0.312,0.433
34
- Toto-2.0-2.5B,Chronos-2,0.346,0.192,0.538,-0.12,-0.209,-0.043
35
- Toto-2.0-2.5B,Toto-2.0-1B,0.462,0.308,0.654,-0.004,-0.012,0.003
36
- Toto-2.0-2.5B,Toto-2.0-2.5B,0.5,0.5,0.5,0.0,0.0,0.0
37
- Toto-2.0-2.5B,TiRex-2,0.5,0.308,0.692,-0.068,-0.162,0.007
38
- Toto-2.0-2.5B,Toto-2.0-313m,0.692,0.538,0.846,0.004,-0.008,0.015
39
- Toto-2.0-2.5B,TabPFN-TS-3,0.423,0.231,0.615,-0.09,-0.198,0.008
40
- Toto-2.0-2.5B,TiRex,0.731,0.538,0.885,0.038,0.013,0.065
41
- Toto-2.0-2.5B,Toto-2.0-22m,0.808,0.654,0.962,0.034,0.021,0.048
42
- Toto-2.0-2.5B,TabPFN-TS,0.654,0.462,0.846,-0.028,-0.125,0.049
43
- Toto-2.0-2.5B,TimesFM-2.5,0.692,0.5,0.846,0.058,0.025,0.092
44
- Toto-2.0-2.5B,FlowState,0.846,0.692,0.962,0.067,0.035,0.101
45
- Toto-2.0-2.5B,Moirai-2.0,0.885,0.768,1.0,0.079,0.051,0.108
46
- Toto-2.0-2.5B,Chronos-Bolt,0.885,0.768,1.0,0.061,0.028,0.091
47
- Toto-2.0-2.5B,Toto-1.0,0.885,0.769,1.0,0.085,0.057,0.115
48
- Toto-2.0-2.5B,Toto-2.0-4m,0.846,0.692,0.962,0.08,0.048,0.112
49
- Toto-2.0-2.5B,Seasonal Naive,1.0,1.0,1.0,0.369,0.312,0.43
50
- TiRex-2,Chronos-2,0.538,0.346,0.731,-0.049,-0.104,-0.003
51
- TiRex-2,Toto-2.0-1B,0.5,0.308,0.692,0.06,-0.009,0.136
52
- TiRex-2,Toto-2.0-2.5B,0.5,0.308,0.692,0.064,-0.007,0.139
53
- TiRex-2,TiRex-2,0.5,0.5,0.5,0.0,0.0,0.0
54
- TiRex-2,Toto-2.0-313m,0.5,0.308,0.692,0.067,-0.004,0.147
55
- TiRex-2,TabPFN-TS-3,0.577,0.385,0.769,-0.02,-0.087,0.038
56
- TiRex-2,TiRex,0.692,0.538,0.846,0.099,0.033,0.169
57
- TiRex-2,Toto-2.0-22m,0.577,0.385,0.769,0.095,0.027,0.165
58
- TiRex-2,TabPFN-TS,0.654,0.462,0.846,0.038,-0.015,0.087
59
- TiRex-2,TimesFM-2.5,0.731,0.538,0.885,0.118,0.044,0.193
60
- TiRex-2,FlowState,0.731,0.577,0.885,0.126,0.058,0.197
61
- TiRex-2,Moirai-2.0,0.808,0.654,0.923,0.138,0.076,0.204
62
- TiRex-2,Chronos-Bolt,0.846,0.692,0.962,0.12,0.05,0.194
63
- TiRex-2,Toto-1.0,0.769,0.615,0.923,0.143,0.077,0.212
64
- TiRex-2,Toto-2.0-4m,0.885,0.769,1.0,0.138,0.066,0.209
65
- TiRex-2,Seasonal Naive,1.0,1.0,1.0,0.41,0.334,0.479
66
- Toto-2.0-313m,Chronos-2,0.385,0.192,0.577,-0.124,-0.216,-0.043
67
- Toto-2.0-313m,Toto-2.0-1B,0.423,0.231,0.615,-0.008,-0.02,0.003
68
- Toto-2.0-313m,Toto-2.0-2.5B,0.308,0.154,0.462,-0.004,-0.015,0.008
69
- Toto-2.0-313m,TiRex-2,0.5,0.308,0.692,-0.072,-0.172,0.004
70
- Toto-2.0-313m,Toto-2.0-313m,0.5,0.5,0.5,0.0,0.0,0.0
71
- Toto-2.0-313m,TabPFN-TS-3,0.462,0.269,0.654,-0.094,-0.204,0.006
72
- Toto-2.0-313m,TiRex,0.654,0.462,0.846,0.034,0.013,0.057
73
- Toto-2.0-313m,Toto-2.0-22m,0.769,0.614,0.923,0.03,0.017,0.045
74
- Toto-2.0-313m,TabPFN-TS,0.615,0.423,0.808,-0.032,-0.133,0.048
75
- Toto-2.0-313m,TimesFM-2.5,0.731,0.538,0.885,0.055,0.025,0.084
76
- Toto-2.0-313m,FlowState,0.808,0.654,0.962,0.063,0.034,0.094
77
- Toto-2.0-313m,Moirai-2.0,0.769,0.577,0.923,0.075,0.046,0.105
78
- Toto-2.0-313m,Chronos-Bolt,0.808,0.654,0.962,0.057,0.023,0.089
79
- Toto-2.0-313m,Toto-1.0,0.846,0.692,0.962,0.081,0.051,0.111
80
- Toto-2.0-313m,Toto-2.0-4m,0.846,0.692,0.962,0.076,0.046,0.105
81
- Toto-2.0-313m,Seasonal Naive,1.0,1.0,1.0,0.367,0.309,0.428
82
- TabPFN-TS-3,Chronos-2,0.346,0.154,0.538,-0.028,-0.072,0.009
83
- TabPFN-TS-3,Toto-2.0-1B,0.538,0.346,0.731,0.079,-0.015,0.163
84
- TabPFN-TS-3,Toto-2.0-2.5B,0.577,0.385,0.769,0.082,-0.008,0.165
85
- TabPFN-TS-3,TiRex-2,0.423,0.231,0.615,0.02,-0.04,0.08
86
- TabPFN-TS-3,Toto-2.0-313m,0.538,0.346,0.731,0.086,-0.006,0.169
87
- TabPFN-TS-3,TabPFN-TS-3,0.5,0.5,0.5,0.0,0.0,0.0
88
- TabPFN-TS-3,TiRex,0.577,0.385,0.769,0.117,0.03,0.195
89
- TabPFN-TS-3,Toto-2.0-22m,0.615,0.423,0.808,0.113,0.029,0.192
90
- TabPFN-TS-3,TabPFN-TS,0.769,0.615,0.923,0.057,0.008,0.098
91
- TabPFN-TS-3,TimesFM-2.5,0.654,0.462,0.809,0.136,0.046,0.217
92
- TabPFN-TS-3,FlowState,0.731,0.538,0.885,0.144,0.053,0.217
93
- TabPFN-TS-3,Moirai-2.0,0.692,0.5,0.846,0.155,0.07,0.235
94
- TabPFN-TS-3,Chronos-Bolt,0.769,0.615,0.923,0.138,0.059,0.21
95
- TabPFN-TS-3,Toto-1.0,0.731,0.538,0.885,0.16,0.078,0.237
96
- TabPFN-TS-3,Toto-2.0-4m,0.692,0.5,0.846,0.155,0.067,0.235
97
- TabPFN-TS-3,Seasonal Naive,1.0,1.0,1.0,0.421,0.35,0.49
98
- TiRex,Chronos-2,0.269,0.115,0.462,-0.164,-0.257,-0.078
99
- TiRex,Toto-2.0-1B,0.308,0.154,0.5,-0.044,-0.075,-0.016
100
- TiRex,Toto-2.0-2.5B,0.269,0.115,0.462,-0.04,-0.069,-0.013
101
- TiRex,TiRex-2,0.308,0.154,0.462,-0.11,-0.204,-0.034
102
- TiRex,Toto-2.0-313m,0.346,0.154,0.538,-0.035,-0.061,-0.013
103
- TiRex,TabPFN-TS-3,0.423,0.231,0.615,-0.133,-0.242,-0.031
104
- TiRex,TiRex,0.5,0.5,0.5,0.0,0.0,0.0
105
- TiRex,Toto-2.0-22m,0.538,0.346,0.731,-0.004,-0.029,0.02
106
- TiRex,TabPFN-TS,0.5,0.308,0.692,-0.068,-0.171,0.014
107
- TiRex,TimesFM-2.5,0.673,0.481,0.846,0.021,-0.002,0.045
108
- TiRex,FlowState,0.635,0.461,0.808,0.03,0.003,0.06
109
- TiRex,Moirai-2.0,0.788,0.615,0.923,0.043,0.014,0.075
110
- TiRex,Chronos-Bolt,0.75,0.577,0.885,0.023,-0.005,0.052
111
- TiRex,Toto-1.0,0.788,0.615,0.923,0.048,0.024,0.076
112
- TiRex,Toto-2.0-4m,0.769,0.614,0.923,0.043,0.012,0.072
113
- TiRex,Seasonal Naive,1.0,1.0,1.0,0.344,0.286,0.404
114
- Toto-2.0-22m,Chronos-2,0.192,0.077,0.346,-0.159,-0.254,-0.077
115
- Toto-2.0-22m,Toto-2.0-1B,0.115,0.0,0.269,-0.039,-0.057,-0.025
116
- Toto-2.0-22m,Toto-2.0-2.5B,0.192,0.038,0.346,-0.035,-0.05,-0.021
117
- Toto-2.0-22m,TiRex-2,0.423,0.231,0.615,-0.106,-0.198,-0.028
118
- Toto-2.0-22m,Toto-2.0-313m,0.231,0.077,0.386,-0.031,-0.047,-0.018
119
- Toto-2.0-22m,TabPFN-TS-3,0.385,0.192,0.577,-0.128,-0.238,-0.029
120
- Toto-2.0-22m,TiRex,0.462,0.269,0.654,0.004,-0.02,0.028
121
- Toto-2.0-22m,Toto-2.0-22m,0.5,0.5,0.5,0.0,0.0,0.0
122
- Toto-2.0-22m,TabPFN-TS,0.5,0.308,0.692,-0.064,-0.17,0.021
123
- Toto-2.0-22m,TimesFM-2.5,0.615,0.423,0.808,0.025,-0.009,0.059
124
- Toto-2.0-22m,FlowState,0.615,0.423,0.808,0.034,-0.001,0.07
125
- Toto-2.0-22m,Moirai-2.0,0.654,0.462,0.846,0.047,0.018,0.075
126
- Toto-2.0-22m,Chronos-Bolt,0.692,0.5,0.885,0.027,-0.009,0.062
127
- Toto-2.0-22m,Toto-1.0,0.769,0.615,0.923,0.052,0.03,0.079
128
- Toto-2.0-22m,Toto-2.0-4m,0.731,0.577,0.885,0.047,0.022,0.073
129
- Toto-2.0-22m,Seasonal Naive,1.0,1.0,1.0,0.347,0.288,0.407
130
- TabPFN-TS,Chronos-2,0.192,0.077,0.346,-0.09,-0.136,-0.046
131
- TabPFN-TS,Toto-2.0-1B,0.346,0.154,0.538,0.023,-0.059,0.107
132
- TabPFN-TS,Toto-2.0-2.5B,0.346,0.154,0.538,0.027,-0.051,0.111
133
- TabPFN-TS,TiRex-2,0.346,0.154,0.538,-0.039,-0.095,0.015
134
- TabPFN-TS,Toto-2.0-313m,0.385,0.192,0.577,0.031,-0.05,0.117
135
- TabPFN-TS,TabPFN-TS-3,0.231,0.077,0.385,-0.06,-0.109,-0.008
136
- TabPFN-TS,TiRex,0.5,0.308,0.692,0.064,-0.014,0.146
137
- TabPFN-TS,Toto-2.0-22m,0.5,0.308,0.692,0.06,-0.022,0.145
138
- TabPFN-TS,TabPFN-TS,0.5,0.5,0.5,0.0,0.0,0.0
139
- TabPFN-TS,TimesFM-2.5,0.5,0.308,0.692,0.084,0.006,0.167
140
- TabPFN-TS,FlowState,0.615,0.423,0.808,0.092,0.015,0.166
141
- TabPFN-TS,Moirai-2.0,0.577,0.385,0.769,0.104,0.024,0.189
142
- TabPFN-TS,Chronos-Bolt,0.654,0.462,0.846,0.086,0.022,0.16
143
- TabPFN-TS,Toto-1.0,0.577,0.385,0.769,0.109,0.026,0.194
144
- TabPFN-TS,Toto-2.0-4m,0.615,0.423,0.808,0.105,0.018,0.189
145
- TabPFN-TS,Seasonal Naive,1.0,1.0,1.0,0.386,0.308,0.462
146
- TimesFM-2.5,Chronos-2,0.231,0.077,0.423,-0.189,-0.291,-0.09
147
- TimesFM-2.5,Toto-2.0-1B,0.192,0.038,0.346,-0.066,-0.106,-0.029
148
- TimesFM-2.5,Toto-2.0-2.5B,0.308,0.154,0.5,-0.062,-0.102,-0.025
149
- TimesFM-2.5,TiRex-2,0.269,0.115,0.462,-0.134,-0.24,-0.046
150
- TimesFM-2.5,Toto-2.0-313m,0.269,0.115,0.462,-0.058,-0.092,-0.026
151
- TimesFM-2.5,TabPFN-TS-3,0.346,0.191,0.538,-0.157,-0.277,-0.048
152
- TimesFM-2.5,TiRex,0.327,0.154,0.519,-0.021,-0.047,0.002
153
- TimesFM-2.5,Toto-2.0-22m,0.385,0.192,0.577,-0.026,-0.062,0.009
154
- TimesFM-2.5,TabPFN-TS,0.5,0.308,0.692,-0.091,-0.2,-0.006
155
- TimesFM-2.5,TimesFM-2.5,0.5,0.5,0.5,0.0,0.0,0.0
156
- TimesFM-2.5,FlowState,0.577,0.404,0.75,0.009,-0.023,0.04
157
- TimesFM-2.5,Moirai-2.0,0.615,0.442,0.808,0.022,-0.023,0.067
158
- TimesFM-2.5,Chronos-Bolt,0.538,0.365,0.712,0.002,-0.028,0.029
159
- TimesFM-2.5,Toto-1.0,0.654,0.462,0.808,0.028,-0.012,0.068
160
- TimesFM-2.5,Toto-2.0-4m,0.615,0.423,0.808,0.023,-0.015,0.057
161
- TimesFM-2.5,Seasonal Naive,1.0,1.0,1.0,0.33,0.269,0.394
162
- FlowState,Chronos-2,0.115,0.0,0.269,-0.2,-0.294,-0.11
163
- FlowState,Toto-2.0-1B,0.154,0.038,0.308,-0.076,-0.116,-0.04
164
- FlowState,Toto-2.0-2.5B,0.154,0.038,0.308,-0.072,-0.113,-0.036
165
- FlowState,TiRex-2,0.269,0.115,0.423,-0.145,-0.245,-0.061
166
- FlowState,Toto-2.0-313m,0.192,0.038,0.346,-0.068,-0.104,-0.035
167
- FlowState,TabPFN-TS-3,0.269,0.115,0.462,-0.168,-0.277,-0.057
168
- FlowState,TiRex,0.365,0.192,0.539,-0.031,-0.064,-0.003
169
- FlowState,Toto-2.0-22m,0.385,0.192,0.577,-0.035,-0.075,0.001
170
- FlowState,TabPFN-TS,0.385,0.192,0.577,-0.102,-0.199,-0.015
171
- FlowState,TimesFM-2.5,0.423,0.25,0.596,-0.009,-0.042,0.022
172
- FlowState,FlowState,0.5,0.5,0.5,0.0,0.0,0.0
173
- FlowState,Moirai-2.0,0.538,0.384,0.712,0.013,-0.029,0.059
174
- FlowState,Chronos-Bolt,0.538,0.365,0.712,-0.007,-0.041,0.029
175
- FlowState,Toto-1.0,0.423,0.269,0.596,0.019,-0.019,0.059
176
- FlowState,Toto-2.0-4m,0.654,0.462,0.809,0.014,-0.03,0.052
177
- FlowState,Seasonal Naive,0.962,0.885,1.0,0.324,0.259,0.389
178
- Moirai-2.0,Chronos-2,0.077,0.0,0.192,-0.216,-0.319,-0.125
179
- Moirai-2.0,Toto-2.0-1B,0.154,0.038,0.308,-0.09,-0.125,-0.058
180
- Moirai-2.0,Toto-2.0-2.5B,0.115,0.0,0.232,-0.086,-0.122,-0.054
181
- Moirai-2.0,TiRex-2,0.192,0.077,0.346,-0.16,-0.257,-0.082
182
- Moirai-2.0,Toto-2.0-313m,0.231,0.077,0.423,-0.082,-0.117,-0.048
183
- Moirai-2.0,TabPFN-TS-3,0.308,0.154,0.5,-0.183,-0.308,-0.075
184
- Moirai-2.0,TiRex,0.212,0.077,0.385,-0.045,-0.081,-0.014
185
- Moirai-2.0,Toto-2.0-22m,0.346,0.154,0.538,-0.049,-0.081,-0.018
186
- Moirai-2.0,TabPFN-TS,0.423,0.231,0.615,-0.116,-0.233,-0.025
187
- Moirai-2.0,TimesFM-2.5,0.385,0.192,0.558,-0.023,-0.071,0.023
188
- Moirai-2.0,FlowState,0.462,0.288,0.616,-0.013,-0.062,0.029
189
- Moirai-2.0,Moirai-2.0,0.5,0.5,0.5,0.0,0.0,0.0
190
- Moirai-2.0,Chronos-Bolt,0.5,0.346,0.673,-0.02,-0.075,0.025
191
- Moirai-2.0,Toto-1.0,0.577,0.423,0.75,0.006,-0.016,0.034
192
- Moirai-2.0,Toto-2.0-4m,0.5,0.308,0.692,0.001,-0.036,0.039
193
- Moirai-2.0,Seasonal Naive,0.923,0.808,1.0,0.315,0.249,0.385
194
- Chronos-Bolt,Chronos-2,0.077,0.0,0.192,-0.192,-0.28,-0.106
195
- Chronos-Bolt,Toto-2.0-1B,0.154,0.038,0.308,-0.069,-0.108,-0.029
196
- Chronos-Bolt,Toto-2.0-2.5B,0.115,0.0,0.232,-0.064,-0.101,-0.028
197
- Chronos-Bolt,TiRex-2,0.154,0.038,0.308,-0.137,-0.24,-0.053
198
- Chronos-Bolt,Toto-2.0-313m,0.192,0.038,0.346,-0.06,-0.097,-0.024
199
- Chronos-Bolt,TabPFN-TS-3,0.231,0.077,0.385,-0.16,-0.266,-0.063
200
- Chronos-Bolt,TiRex,0.25,0.115,0.423,-0.024,-0.055,0.005
201
- Chronos-Bolt,Toto-2.0-22m,0.308,0.115,0.5,-0.028,-0.066,0.009
202
- Chronos-Bolt,TabPFN-TS,0.346,0.154,0.538,-0.094,-0.19,-0.023
203
- Chronos-Bolt,TimesFM-2.5,0.462,0.288,0.635,-0.002,-0.03,0.027
204
- Chronos-Bolt,FlowState,0.462,0.288,0.635,0.007,-0.03,0.039
205
- Chronos-Bolt,Moirai-2.0,0.5,0.327,0.654,0.02,-0.025,0.07
206
- Chronos-Bolt,Chronos-Bolt,0.5,0.5,0.5,0.0,0.0,0.0
207
- Chronos-Bolt,Toto-1.0,0.538,0.365,0.712,0.026,-0.013,0.068
208
- Chronos-Bolt,Toto-2.0-4m,0.5,0.308,0.692,0.021,-0.023,0.063
209
- Chronos-Bolt,Seasonal Naive,1.0,1.0,1.0,0.329,0.273,0.388
210
- Toto-1.0,Chronos-2,0.154,0.038,0.308,-0.224,-0.332,-0.13
211
- Toto-1.0,Toto-2.0-1B,0.077,0.0,0.192,-0.097,-0.136,-0.063
212
- Toto-1.0,Toto-2.0-2.5B,0.115,0.0,0.231,-0.092,-0.13,-0.06
213
- Toto-1.0,TiRex-2,0.231,0.077,0.385,-0.167,-0.27,-0.084
214
- Toto-1.0,Toto-2.0-313m,0.154,0.038,0.308,-0.088,-0.125,-0.054
215
- Toto-1.0,TabPFN-TS-3,0.269,0.115,0.462,-0.19,-0.311,-0.085
216
- Toto-1.0,TiRex,0.212,0.077,0.385,-0.051,-0.082,-0.024
217
- Toto-1.0,Toto-2.0-22m,0.231,0.077,0.385,-0.055,-0.085,-0.031
218
- Toto-1.0,TabPFN-TS,0.423,0.231,0.615,-0.123,-0.241,-0.027
219
- Toto-1.0,TimesFM-2.5,0.346,0.192,0.538,-0.029,-0.073,0.011
220
- Toto-1.0,FlowState,0.577,0.404,0.731,-0.019,-0.063,0.019
221
- Toto-1.0,Moirai-2.0,0.423,0.25,0.577,-0.006,-0.035,0.016
222
- Toto-1.0,Chronos-Bolt,0.462,0.288,0.635,-0.026,-0.072,0.013
223
- Toto-1.0,Toto-1.0,0.5,0.5,0.5,0.0,0.0,0.0
224
- Toto-1.0,Toto-2.0-4m,0.5,0.308,0.692,-0.005,-0.037,0.02
225
- Toto-1.0,Seasonal Naive,0.962,0.885,1.0,0.311,0.248,0.377
226
- Toto-2.0-4m,Chronos-2,0.115,0.0,0.232,-0.217,-0.33,-0.116
227
- Toto-2.0-4m,Toto-2.0-1B,0.115,0.0,0.269,-0.091,-0.132,-0.054
228
- Toto-2.0-4m,Toto-2.0-2.5B,0.154,0.038,0.308,-0.087,-0.126,-0.05
229
- Toto-2.0-4m,TiRex-2,0.115,0.0,0.231,-0.161,-0.264,-0.071
230
- Toto-2.0-4m,Toto-2.0-313m,0.154,0.038,0.308,-0.082,-0.117,-0.049
231
- Toto-2.0-4m,TabPFN-TS-3,0.308,0.154,0.5,-0.184,-0.307,-0.072
232
- Toto-2.0-4m,TiRex,0.231,0.077,0.386,-0.045,-0.078,-0.012
233
- Toto-2.0-4m,Toto-2.0-22m,0.269,0.115,0.423,-0.05,-0.079,-0.023
234
- Toto-2.0-4m,TabPFN-TS,0.385,0.192,0.577,-0.117,-0.234,-0.018
235
- Toto-2.0-4m,TimesFM-2.5,0.385,0.192,0.577,-0.023,-0.061,0.015
236
- Toto-2.0-4m,FlowState,0.346,0.191,0.538,-0.014,-0.054,0.029
237
- Toto-2.0-4m,Moirai-2.0,0.5,0.308,0.692,-0.001,-0.041,0.035
238
- Toto-2.0-4m,Chronos-Bolt,0.5,0.308,0.692,-0.021,-0.067,0.023
239
- Toto-2.0-4m,Toto-1.0,0.5,0.308,0.692,0.005,-0.02,0.036
240
- Toto-2.0-4m,Toto-2.0-4m,0.5,0.5,0.5,0.0,0.0,0.0
241
- Toto-2.0-4m,Seasonal Naive,1.0,1.0,1.0,0.315,0.256,0.378
242
- Seasonal Naive,Chronos-2,0.0,0.0,0.0,-0.776,-0.987,-0.581
243
- Seasonal Naive,Toto-2.0-1B,0.0,0.0,0.0,-0.592,-0.765,-0.454
244
- Seasonal Naive,Toto-2.0-2.5B,0.0,0.0,0.0,-0.586,-0.754,-0.453
245
- Seasonal Naive,TiRex-2,0.0,0.0,0.0,-0.694,-0.92,-0.5
246
- Seasonal Naive,Toto-2.0-313m,0.0,0.0,0.0,-0.58,-0.749,-0.446
247
- Seasonal Naive,TabPFN-TS-3,0.0,0.0,0.0,-0.728,-0.962,-0.539
248
- Seasonal Naive,TiRex,0.0,0.0,0.0,-0.526,-0.679,-0.401
249
- Seasonal Naive,Toto-2.0-22m,0.0,0.0,0.0,-0.532,-0.686,-0.404
250
- Seasonal Naive,TabPFN-TS,0.0,0.0,0.0,-0.63,-0.858,-0.445
251
- Seasonal Naive,TimesFM-2.5,0.0,0.0,0.0,-0.493,-0.65,-0.368
252
- Seasonal Naive,FlowState,0.038,0.0,0.115,-0.48,-0.638,-0.35
253
- Seasonal Naive,Moirai-2.0,0.077,0.0,0.192,-0.46,-0.627,-0.331
254
- Seasonal Naive,Chronos-Bolt,0.0,0.0,0.0,-0.49,-0.633,-0.376
255
- Seasonal Naive,Toto-1.0,0.038,0.0,0.115,-0.452,-0.604,-0.33
256
- Seasonal Naive,Toto-2.0-4m,0.0,0.0,0.0,-0.459,-0.608,-0.344
257
- Seasonal Naive,Seasonal Naive,0.5,0.5,0.5,0.0,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_energy/pairwise_WAPE.csv DELETED
@@ -1,257 +0,0 @@
1
- model_1,model_2,win_rate,win_rate_lower,win_rate_upper,skill_score,skill_score_lower,skill_score_upper
2
- Chronos-2,Chronos-2,0.5,0.5,0.5,0.0,0.0,0.0
3
- Chronos-2,Toto-2.0-313m,0.615,0.423,0.808,0.099,0.028,0.168
4
- Chronos-2,Toto-2.0-1B,0.615,0.423,0.808,0.095,0.019,0.17
5
- Chronos-2,Toto-2.0-2.5B,0.615,0.423,0.808,0.104,0.03,0.173
6
- Chronos-2,TiRex-2,0.615,0.423,0.808,0.048,0.002,0.096
7
- Chronos-2,TabPFN-TS-3,0.731,0.538,0.885,0.045,-0.012,0.099
8
- Chronos-2,Toto-2.0-22m,0.692,0.5,0.846,0.122,0.054,0.188
9
- Chronos-2,TabPFN-TS,0.808,0.654,0.923,0.103,0.035,0.178
10
- Chronos-2,TiRex,0.846,0.692,0.962,0.141,0.074,0.204
11
- Chronos-2,TimesFM-2.5,0.731,0.538,0.885,0.149,0.075,0.214
12
- Chronos-2,Moirai-2.0,0.885,0.731,1.0,0.156,0.089,0.221
13
- Chronos-2,Chronos-Bolt,0.923,0.808,1.0,0.149,0.081,0.219
14
- Chronos-2,FlowState,0.808,0.654,0.923,0.146,0.079,0.202
15
- Chronos-2,Sundial-Base,0.846,0.692,0.962,0.13,0.071,0.194
16
- Chronos-2,Toto-1.0,0.885,0.769,1.0,0.176,0.109,0.244
17
- Chronos-2,Seasonal Naive,0.923,0.808,1.0,0.376,0.282,0.449
18
- Toto-2.0-313m,Chronos-2,0.385,0.192,0.577,-0.11,-0.202,-0.029
19
- Toto-2.0-313m,Toto-2.0-313m,0.5,0.5,0.5,0.0,0.0,0.0
20
- Toto-2.0-313m,Toto-2.0-1B,0.538,0.346,0.731,-0.005,-0.026,0.012
21
- Toto-2.0-313m,Toto-2.0-2.5B,0.423,0.231,0.615,0.006,-0.007,0.018
22
- Toto-2.0-313m,TiRex-2,0.538,0.346,0.731,-0.057,-0.158,0.028
23
- Toto-2.0-313m,TabPFN-TS-3,0.577,0.385,0.769,-0.06,-0.174,0.05
24
- Toto-2.0-313m,Toto-2.0-22m,0.731,0.538,0.885,0.026,0.005,0.044
25
- Toto-2.0-313m,TabPFN-TS,0.692,0.5,0.846,0.005,-0.109,0.1
26
- Toto-2.0-313m,TiRex,0.654,0.462,0.846,0.047,0.019,0.079
27
- Toto-2.0-313m,TimesFM-2.5,0.769,0.615,0.923,0.055,0.019,0.099
28
- Toto-2.0-313m,Moirai-2.0,0.769,0.577,0.923,0.064,0.026,0.103
29
- Toto-2.0-313m,Chronos-Bolt,0.846,0.692,0.962,0.056,0.014,0.105
30
- Toto-2.0-313m,FlowState,0.808,0.654,0.962,0.052,0.012,0.09
31
- Toto-2.0-313m,Sundial-Base,0.769,0.615,0.923,0.034,-0.073,0.132
32
- Toto-2.0-313m,Toto-1.0,0.846,0.692,0.962,0.086,0.056,0.12
33
- Toto-2.0-313m,Seasonal Naive,0.923,0.808,1.0,0.307,0.221,0.386
34
- Toto-2.0-1B,Chronos-2,0.385,0.192,0.577,-0.104,-0.204,-0.02
35
- Toto-2.0-1B,Toto-2.0-313m,0.462,0.269,0.654,0.005,-0.012,0.025
36
- Toto-2.0-1B,Toto-2.0-1B,0.5,0.5,0.5,0.0,0.0,0.0
37
- Toto-2.0-1B,Toto-2.0-2.5B,0.5,0.308,0.692,0.01,-0.003,0.026
38
- Toto-2.0-1B,TiRex-2,0.577,0.385,0.769,-0.052,-0.153,0.034
39
- Toto-2.0-1B,TabPFN-TS-3,0.462,0.269,0.654,-0.055,-0.17,0.057
40
- Toto-2.0-1B,Toto-2.0-22m,0.769,0.577,0.923,0.03,0.006,0.053
41
- Toto-2.0-1B,TabPFN-TS,0.577,0.385,0.769,0.01,-0.1,0.109
42
- Toto-2.0-1B,TiRex,0.769,0.615,0.923,0.051,0.016,0.094
43
- Toto-2.0-1B,TimesFM-2.5,0.808,0.654,0.962,0.06,0.02,0.109
44
- Toto-2.0-1B,Moirai-2.0,0.769,0.577,0.923,0.068,0.029,0.113
45
- Toto-2.0-1B,Chronos-Bolt,0.808,0.654,0.962,0.06,0.011,0.118
46
- Toto-2.0-1B,FlowState,0.769,0.615,0.923,0.057,0.015,0.097
47
- Toto-2.0-1B,Sundial-Base,0.808,0.654,0.962,0.039,-0.069,0.14
48
- Toto-2.0-1B,Toto-1.0,0.808,0.654,0.962,0.09,0.054,0.13
49
- Toto-2.0-1B,Seasonal Naive,0.962,0.885,1.0,0.31,0.223,0.392
50
- Toto-2.0-2.5B,Chronos-2,0.385,0.192,0.577,-0.116,-0.209,-0.031
51
- Toto-2.0-2.5B,Toto-2.0-313m,0.577,0.385,0.769,-0.006,-0.018,0.007
52
- Toto-2.0-2.5B,Toto-2.0-1B,0.5,0.308,0.692,-0.011,-0.027,0.003
53
- Toto-2.0-2.5B,Toto-2.0-2.5B,0.5,0.5,0.5,0.0,0.0,0.0
54
- Toto-2.0-2.5B,TiRex-2,0.577,0.385,0.769,-0.063,-0.16,0.02
55
- Toto-2.0-2.5B,TabPFN-TS-3,0.5,0.346,0.692,-0.066,-0.174,0.041
56
- Toto-2.0-2.5B,Toto-2.0-22m,0.731,0.538,0.885,0.02,0.002,0.037
57
- Toto-2.0-2.5B,TabPFN-TS,0.615,0.423,0.808,-0.001,-0.108,0.094
58
- Toto-2.0-2.5B,TiRex,0.692,0.5,0.885,0.041,0.011,0.077
59
- Toto-2.0-2.5B,TimesFM-2.5,0.692,0.5,0.885,0.05,0.012,0.097
60
- Toto-2.0-2.5B,Moirai-2.0,0.731,0.538,0.885,0.058,0.019,0.099
61
- Toto-2.0-2.5B,Chronos-Bolt,0.808,0.654,0.962,0.05,0.005,0.099
62
- Toto-2.0-2.5B,FlowState,0.769,0.615,0.923,0.047,0.006,0.086
63
- Toto-2.0-2.5B,Sundial-Base,0.731,0.577,0.885,0.028,-0.075,0.128
64
- Toto-2.0-2.5B,Toto-1.0,0.769,0.577,0.923,0.08,0.048,0.119
65
- Toto-2.0-2.5B,Seasonal Naive,0.923,0.808,1.0,0.303,0.219,0.384
66
- TiRex-2,Chronos-2,0.385,0.192,0.577,-0.05,-0.106,-0.002
67
- TiRex-2,Toto-2.0-313m,0.462,0.269,0.654,0.054,-0.029,0.137
68
- TiRex-2,Toto-2.0-1B,0.423,0.231,0.615,0.049,-0.035,0.133
69
- TiRex-2,Toto-2.0-2.5B,0.423,0.231,0.615,0.059,-0.02,0.138
70
- TiRex-2,TiRex-2,0.5,0.5,0.5,0.0,0.0,0.0
71
- TiRex-2,TabPFN-TS-3,0.538,0.346,0.731,-0.003,-0.078,0.069
72
- TiRex-2,Toto-2.0-22m,0.538,0.346,0.731,0.078,0.004,0.154
73
- TiRex-2,TabPFN-TS,0.692,0.5,0.846,0.058,-0.019,0.139
74
- TiRex-2,TiRex,0.577,0.385,0.769,0.098,0.027,0.167
75
- TiRex-2,TimesFM-2.5,0.615,0.423,0.769,0.106,0.033,0.182
76
- TiRex-2,Moirai-2.0,0.731,0.538,0.885,0.114,0.041,0.183
77
- TiRex-2,Chronos-Bolt,0.654,0.462,0.846,0.107,0.025,0.193
78
- TiRex-2,FlowState,0.731,0.538,0.885,0.103,0.027,0.175
79
- TiRex-2,Sundial-Base,0.769,0.615,0.923,0.086,0.001,0.169
80
- TiRex-2,Toto-1.0,0.577,0.385,0.769,0.135,0.059,0.211
81
- TiRex-2,Seasonal Naive,0.962,0.885,1.0,0.344,0.247,0.425
82
- TabPFN-TS-3,Chronos-2,0.269,0.115,0.462,-0.047,-0.11,0.012
83
- TabPFN-TS-3,Toto-2.0-313m,0.423,0.231,0.615,0.056,-0.053,0.148
84
- TabPFN-TS-3,Toto-2.0-1B,0.538,0.346,0.731,0.052,-0.061,0.145
85
- TabPFN-TS-3,Toto-2.0-2.5B,0.5,0.308,0.654,0.062,-0.043,0.148
86
- TabPFN-TS-3,TiRex-2,0.462,0.269,0.654,0.003,-0.074,0.072
87
- TabPFN-TS-3,TabPFN-TS-3,0.5,0.5,0.5,0.0,0.0,0.0
88
- TabPFN-TS-3,Toto-2.0-22m,0.577,0.385,0.769,0.081,-0.016,0.164
89
- TabPFN-TS-3,TabPFN-TS,0.692,0.5,0.846,0.061,-0.003,0.119
90
- TabPFN-TS-3,TiRex,0.538,0.346,0.731,0.1,0.002,0.189
91
- TabPFN-TS-3,TimesFM-2.5,0.577,0.385,0.769,0.109,0.018,0.192
92
- TabPFN-TS-3,Moirai-2.0,0.654,0.462,0.809,0.116,0.015,0.206
93
- TabPFN-TS-3,Chronos-Bolt,0.654,0.462,0.846,0.109,0.021,0.191
94
- TabPFN-TS-3,FlowState,0.654,0.462,0.846,0.106,0.011,0.188
95
- TabPFN-TS-3,Sundial-Base,0.654,0.462,0.846,0.089,0.008,0.164
96
- TabPFN-TS-3,Toto-1.0,0.654,0.462,0.808,0.137,0.046,0.221
97
- TabPFN-TS-3,Seasonal Naive,0.962,0.885,1.0,0.346,0.261,0.422
98
- Toto-2.0-22m,Chronos-2,0.308,0.154,0.5,-0.139,-0.232,-0.057
99
- Toto-2.0-22m,Toto-2.0-313m,0.269,0.115,0.462,-0.027,-0.046,-0.005
100
- Toto-2.0-22m,Toto-2.0-1B,0.231,0.077,0.423,-0.031,-0.055,-0.006
101
- Toto-2.0-22m,Toto-2.0-2.5B,0.269,0.115,0.462,-0.021,-0.039,-0.002
102
- Toto-2.0-22m,TiRex-2,0.462,0.269,0.654,-0.085,-0.181,-0.004
103
- Toto-2.0-22m,TabPFN-TS-3,0.423,0.231,0.615,-0.088,-0.197,0.015
104
- Toto-2.0-22m,Toto-2.0-22m,0.5,0.5,0.5,0.0,0.0,0.0
105
- Toto-2.0-22m,TabPFN-TS,0.5,0.308,0.692,-0.022,-0.126,0.071
106
- Toto-2.0-22m,TiRex,0.5,0.308,0.692,0.021,-0.012,0.058
107
- Toto-2.0-22m,TimesFM-2.5,0.5,0.308,0.692,0.03,-0.011,0.078
108
- Toto-2.0-22m,Moirai-2.0,0.577,0.385,0.769,0.039,-0.002,0.079
109
- Toto-2.0-22m,Chronos-Bolt,0.692,0.5,0.846,0.031,-0.011,0.077
110
- Toto-2.0-22m,FlowState,0.654,0.5,0.808,0.027,-0.018,0.066
111
- Toto-2.0-22m,Sundial-Base,0.615,0.423,0.808,0.008,-0.099,0.104
112
- Toto-2.0-22m,Toto-1.0,0.692,0.5,0.846,0.061,0.032,0.094
113
- Toto-2.0-22m,Seasonal Naive,0.962,0.885,1.0,0.289,0.209,0.365
114
- TabPFN-TS,Chronos-2,0.192,0.077,0.346,-0.115,-0.216,-0.036
115
- TabPFN-TS,Toto-2.0-313m,0.308,0.154,0.5,-0.005,-0.112,0.098
116
- TabPFN-TS,Toto-2.0-1B,0.423,0.231,0.615,-0.01,-0.123,0.091
117
- TabPFN-TS,Toto-2.0-2.5B,0.385,0.192,0.577,0.001,-0.103,0.098
118
- TabPFN-TS,TiRex-2,0.308,0.154,0.5,-0.062,-0.161,0.018
119
- TabPFN-TS,TabPFN-TS-3,0.308,0.154,0.5,-0.065,-0.135,0.003
120
- TabPFN-TS,Toto-2.0-22m,0.5,0.308,0.692,0.021,-0.076,0.112
121
- TabPFN-TS,TabPFN-TS,0.5,0.5,0.5,0.0,0.0,0.0
122
- TabPFN-TS,TiRex,0.462,0.269,0.654,0.042,-0.07,0.138
123
- TabPFN-TS,TimesFM-2.5,0.538,0.346,0.731,0.051,-0.047,0.137
124
- TabPFN-TS,Moirai-2.0,0.538,0.346,0.731,0.059,-0.056,0.163
125
- TabPFN-TS,Chronos-Bolt,0.538,0.346,0.731,0.051,-0.035,0.132
126
- TabPFN-TS,FlowState,0.577,0.385,0.769,0.047,-0.06,0.132
127
- TabPFN-TS,Sundial-Base,0.615,0.423,0.808,0.029,-0.086,0.132
128
- TabPFN-TS,Toto-1.0,0.577,0.385,0.769,0.081,-0.022,0.177
129
- TabPFN-TS,Seasonal Naive,0.962,0.885,1.0,0.304,0.213,0.381
130
- TiRex,Chronos-2,0.154,0.038,0.308,-0.164,-0.256,-0.08
131
- TiRex,Toto-2.0-313m,0.346,0.154,0.538,-0.049,-0.085,-0.019
132
- TiRex,Toto-2.0-1B,0.231,0.077,0.385,-0.054,-0.104,-0.017
133
- TiRex,Toto-2.0-2.5B,0.308,0.115,0.5,-0.043,-0.084,-0.011
134
- TiRex,TiRex-2,0.423,0.231,0.615,-0.108,-0.201,-0.027
135
- TiRex,TabPFN-TS-3,0.462,0.269,0.654,-0.112,-0.233,-0.002
136
- TiRex,Toto-2.0-22m,0.5,0.308,0.692,-0.022,-0.061,0.012
137
- TiRex,TabPFN-TS,0.538,0.346,0.731,-0.044,-0.161,0.065
138
- TiRex,TiRex,0.5,0.5,0.5,0.0,0.0,0.0
139
- TiRex,TimesFM-2.5,0.558,0.365,0.75,0.009,-0.023,0.041
140
- TiRex,Moirai-2.0,0.442,0.269,0.615,0.018,-0.013,0.051
141
- TiRex,Chronos-Bolt,0.481,0.308,0.673,0.01,-0.028,0.06
142
- TiRex,FlowState,0.519,0.346,0.692,0.006,-0.029,0.041
143
- TiRex,Sundial-Base,0.635,0.462,0.808,-0.013,-0.12,0.076
144
- TiRex,Toto-1.0,0.712,0.538,0.885,0.041,0.009,0.076
145
- TiRex,Seasonal Naive,0.885,0.731,1.0,0.273,0.184,0.352
146
- TimesFM-2.5,Chronos-2,0.269,0.115,0.462,-0.175,-0.273,-0.081
147
- TimesFM-2.5,Toto-2.0-313m,0.231,0.077,0.385,-0.058,-0.11,-0.019
148
- TimesFM-2.5,Toto-2.0-1B,0.192,0.038,0.346,-0.063,-0.122,-0.021
149
- TimesFM-2.5,Toto-2.0-2.5B,0.308,0.115,0.5,-0.052,-0.107,-0.012
150
- TimesFM-2.5,TiRex-2,0.385,0.231,0.577,-0.119,-0.222,-0.034
151
- TimesFM-2.5,TabPFN-TS-3,0.423,0.231,0.615,-0.122,-0.238,-0.019
152
- TimesFM-2.5,Toto-2.0-22m,0.5,0.308,0.692,-0.031,-0.085,0.011
153
- TimesFM-2.5,TabPFN-TS,0.462,0.269,0.654,-0.053,-0.159,0.045
154
- TimesFM-2.5,TiRex,0.442,0.25,0.635,-0.009,-0.043,0.023
155
- TimesFM-2.5,TimesFM-2.5,0.5,0.5,0.5,0.0,0.0,0.0
156
- TimesFM-2.5,Moirai-2.0,0.577,0.404,0.75,0.009,-0.046,0.062
157
- TimesFM-2.5,Chronos-Bolt,0.5,0.327,0.674,0.001,-0.039,0.042
158
- TimesFM-2.5,FlowState,0.538,0.365,0.712,-0.003,-0.048,0.038
159
- TimesFM-2.5,Sundial-Base,0.596,0.423,0.788,-0.022,-0.12,0.067
160
- TimesFM-2.5,Toto-1.0,0.654,0.481,0.808,0.032,-0.012,0.081
161
- TimesFM-2.5,Seasonal Naive,0.923,0.808,1.0,0.267,0.184,0.338
162
- Moirai-2.0,Chronos-2,0.115,0.0,0.269,-0.185,-0.284,-0.098
163
- Moirai-2.0,Toto-2.0-313m,0.231,0.077,0.423,-0.068,-0.114,-0.027
164
- Moirai-2.0,Toto-2.0-1B,0.231,0.077,0.423,-0.073,-0.128,-0.029
165
- Moirai-2.0,Toto-2.0-2.5B,0.269,0.115,0.462,-0.062,-0.11,-0.02
166
- Moirai-2.0,TiRex-2,0.269,0.115,0.462,-0.129,-0.223,-0.043
167
- Moirai-2.0,TabPFN-TS-3,0.346,0.191,0.538,-0.132,-0.26,-0.016
168
- Moirai-2.0,Toto-2.0-22m,0.423,0.231,0.615,-0.04,-0.086,0.002
169
- Moirai-2.0,TabPFN-TS,0.462,0.269,0.654,-0.063,-0.195,0.053
170
- Moirai-2.0,TiRex,0.558,0.385,0.731,-0.018,-0.054,0.013
171
- Moirai-2.0,TimesFM-2.5,0.423,0.25,0.596,-0.009,-0.067,0.044
172
- Moirai-2.0,Moirai-2.0,0.5,0.5,0.5,0.0,0.0,0.0
173
- Moirai-2.0,Chronos-Bolt,0.423,0.269,0.596,-0.008,-0.073,0.062
174
- Moirai-2.0,FlowState,0.538,0.365,0.712,-0.012,-0.065,0.03
175
- Moirai-2.0,Sundial-Base,0.596,0.423,0.769,-0.032,-0.143,0.065
176
- Moirai-2.0,Toto-1.0,0.577,0.404,0.75,0.024,-0.008,0.056
177
- Moirai-2.0,Seasonal Naive,0.808,0.654,0.924,0.26,0.164,0.341
178
- Chronos-Bolt,Chronos-2,0.077,0.0,0.192,-0.175,-0.28,-0.089
179
- Chronos-Bolt,Toto-2.0-313m,0.154,0.038,0.308,-0.059,-0.118,-0.014
180
- Chronos-Bolt,Toto-2.0-1B,0.192,0.038,0.346,-0.064,-0.133,-0.011
181
- Chronos-Bolt,Toto-2.0-2.5B,0.192,0.038,0.346,-0.053,-0.109,-0.005
182
- Chronos-Bolt,TiRex-2,0.346,0.154,0.538,-0.119,-0.24,-0.026
183
- Chronos-Bolt,TabPFN-TS-3,0.346,0.154,0.538,-0.123,-0.236,-0.021
184
- Chronos-Bolt,Toto-2.0-22m,0.308,0.154,0.5,-0.032,-0.083,0.011
185
- Chronos-Bolt,TabPFN-TS,0.462,0.269,0.654,-0.054,-0.152,0.034
186
- Chronos-Bolt,TiRex,0.519,0.327,0.692,-0.01,-0.064,0.027
187
- Chronos-Bolt,TimesFM-2.5,0.5,0.326,0.673,-0.001,-0.044,0.038
188
- Chronos-Bolt,Moirai-2.0,0.577,0.404,0.731,0.008,-0.066,0.068
189
- Chronos-Bolt,Chronos-Bolt,0.5,0.5,0.5,0.0,0.0,0.0
190
- Chronos-Bolt,FlowState,0.5,0.327,0.673,-0.004,-0.072,0.041
191
- Chronos-Bolt,Sundial-Base,0.519,0.327,0.692,-0.023,-0.128,0.067
192
- Chronos-Bolt,Toto-1.0,0.615,0.442,0.788,0.032,-0.022,0.08
193
- Chronos-Bolt,Seasonal Naive,0.923,0.808,1.0,0.266,0.183,0.339
194
- FlowState,Chronos-2,0.192,0.077,0.346,-0.171,-0.253,-0.086
195
- FlowState,Toto-2.0-313m,0.192,0.038,0.346,-0.055,-0.098,-0.012
196
- FlowState,Toto-2.0-1B,0.231,0.077,0.385,-0.06,-0.108,-0.016
197
- FlowState,Toto-2.0-2.5B,0.231,0.077,0.385,-0.049,-0.094,-0.006
198
- FlowState,TiRex-2,0.269,0.115,0.462,-0.115,-0.212,-0.027
199
- FlowState,TabPFN-TS-3,0.346,0.154,0.538,-0.118,-0.231,-0.011
200
- FlowState,Toto-2.0-22m,0.346,0.192,0.5,-0.028,-0.07,0.018
201
- FlowState,TabPFN-TS,0.423,0.231,0.615,-0.05,-0.152,0.056
202
- FlowState,TiRex,0.481,0.308,0.654,-0.006,-0.043,0.028
203
- FlowState,TimesFM-2.5,0.462,0.288,0.635,0.003,-0.04,0.046
204
- FlowState,Moirai-2.0,0.462,0.288,0.635,0.012,-0.031,0.061
205
- FlowState,Chronos-Bolt,0.5,0.327,0.673,0.004,-0.043,0.067
206
- FlowState,FlowState,0.5,0.5,0.5,0.0,0.0,0.0
207
- FlowState,Sundial-Base,0.558,0.385,0.75,-0.019,-0.118,0.069
208
- FlowState,Toto-1.0,0.5,0.327,0.692,0.035,-0.006,0.084
209
- FlowState,Seasonal Naive,0.769,0.577,0.923,0.269,0.178,0.347
210
- Sundial-Base,Chronos-2,0.154,0.038,0.308,-0.149,-0.241,-0.077
211
- Sundial-Base,Toto-2.0-313m,0.231,0.077,0.385,-0.035,-0.153,0.068
212
- Sundial-Base,Toto-2.0-1B,0.192,0.038,0.346,-0.04,-0.162,0.064
213
- Sundial-Base,Toto-2.0-2.5B,0.269,0.115,0.423,-0.029,-0.146,0.07
214
- Sundial-Base,TiRex-2,0.231,0.077,0.385,-0.094,-0.203,-0.001
215
- Sundial-Base,TabPFN-TS-3,0.346,0.154,0.538,-0.097,-0.196,-0.008
216
- Sundial-Base,Toto-2.0-22m,0.385,0.192,0.577,-0.008,-0.116,0.09
217
- Sundial-Base,TabPFN-TS,0.385,0.192,0.577,-0.03,-0.153,0.08
218
- Sundial-Base,TiRex,0.365,0.192,0.538,0.013,-0.083,0.107
219
- Sundial-Base,TimesFM-2.5,0.404,0.212,0.577,0.022,-0.072,0.107
220
- Sundial-Base,Moirai-2.0,0.404,0.231,0.577,0.031,-0.069,0.125
221
- Sundial-Base,Chronos-Bolt,0.481,0.308,0.673,0.023,-0.072,0.113
222
- Sundial-Base,FlowState,0.442,0.25,0.615,0.019,-0.074,0.106
223
- Sundial-Base,Sundial-Base,0.5,0.5,0.5,0.0,0.0,0.0
224
- Sundial-Base,Toto-1.0,0.519,0.327,0.712,0.054,-0.039,0.14
225
- Sundial-Base,Seasonal Naive,0.846,0.692,0.962,0.283,0.183,0.364
226
- Toto-1.0,Chronos-2,0.115,0.0,0.231,-0.214,-0.323,-0.123
227
- Toto-1.0,Toto-2.0-313m,0.154,0.038,0.308,-0.094,-0.136,-0.059
228
- Toto-1.0,Toto-2.0-1B,0.192,0.038,0.346,-0.099,-0.15,-0.058
229
- Toto-1.0,Toto-2.0-2.5B,0.231,0.077,0.423,-0.088,-0.135,-0.051
230
- Toto-1.0,TiRex-2,0.423,0.231,0.615,-0.156,-0.268,-0.062
231
- Toto-1.0,TabPFN-TS-3,0.346,0.192,0.538,-0.159,-0.284,-0.048
232
- Toto-1.0,Toto-2.0-22m,0.308,0.154,0.5,-0.065,-0.104,-0.033
233
- Toto-1.0,TabPFN-TS,0.423,0.231,0.615,-0.088,-0.215,0.022
234
- Toto-1.0,TiRex,0.288,0.115,0.462,-0.043,-0.083,-0.009
235
- Toto-1.0,TimesFM-2.5,0.346,0.192,0.519,-0.033,-0.088,0.012
236
- Toto-1.0,Moirai-2.0,0.423,0.25,0.596,-0.024,-0.06,0.008
237
- Toto-1.0,Chronos-Bolt,0.385,0.212,0.558,-0.033,-0.087,0.021
238
- Toto-1.0,FlowState,0.5,0.308,0.673,-0.037,-0.092,0.006
239
- Toto-1.0,Sundial-Base,0.481,0.288,0.673,-0.057,-0.163,0.038
240
- Toto-1.0,Toto-1.0,0.5,0.5,0.5,0.0,0.0,0.0
241
- Toto-1.0,Seasonal Naive,0.846,0.654,0.962,0.242,0.151,0.321
242
- Seasonal Naive,Chronos-2,0.077,0.0,0.192,-0.601,-0.814,-0.393
243
- Seasonal Naive,Toto-2.0-313m,0.077,0.0,0.192,-0.443,-0.63,-0.284
244
- Seasonal Naive,Toto-2.0-1B,0.038,0.0,0.115,-0.45,-0.645,-0.288
245
- Seasonal Naive,Toto-2.0-2.5B,0.077,0.0,0.192,-0.435,-0.623,-0.28
246
- Seasonal Naive,TiRex-2,0.038,0.0,0.115,-0.525,-0.739,-0.328
247
- Seasonal Naive,TabPFN-TS-3,0.038,0.0,0.115,-0.529,-0.73,-0.353
248
- Seasonal Naive,Toto-2.0-22m,0.038,0.0,0.115,-0.406,-0.574,-0.264
249
- Seasonal Naive,TabPFN-TS,0.038,0.0,0.115,-0.436,-0.616,-0.27
250
- Seasonal Naive,TiRex,0.115,0.0,0.269,-0.376,-0.544,-0.225
251
- Seasonal Naive,TimesFM-2.5,0.077,0.0,0.192,-0.363,-0.511,-0.225
252
- Seasonal Naive,Moirai-2.0,0.192,0.076,0.346,-0.351,-0.517,-0.196
253
- Seasonal Naive,Chronos-Bolt,0.077,0.0,0.192,-0.363,-0.513,-0.225
254
- Seasonal Naive,FlowState,0.231,0.077,0.423,-0.368,-0.532,-0.217
255
- Seasonal Naive,Sundial-Base,0.154,0.038,0.308,-0.394,-0.572,-0.225
256
- Seasonal Naive,Toto-1.0,0.154,0.038,0.346,-0.319,-0.473,-0.178
257
- Seasonal Naive,Seasonal Naive,0.5,0.5,0.5,0.0,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_energy/pairwise_WQL.csv DELETED
@@ -1,257 +0,0 @@
1
- model_1,model_2,win_rate,win_rate_lower,win_rate_upper,skill_score,skill_score_lower,skill_score_upper
2
- Chronos-2,Chronos-2,0.5,0.5,0.5,0.0,0.0,0.0
3
- Chronos-2,Toto-2.0-1B,0.5,0.308,0.692,0.085,0.012,0.16
4
- Chronos-2,Toto-2.0-2.5B,0.577,0.385,0.769,0.096,0.024,0.164
5
- Chronos-2,Toto-2.0-313m,0.538,0.346,0.731,0.093,0.022,0.164
6
- Chronos-2,TiRex-2,0.577,0.385,0.769,0.045,-0.001,0.094
7
- Chronos-2,TabPFN-TS-3,0.692,0.5,0.846,0.051,-0.003,0.106
8
- Chronos-2,Toto-2.0-22m,0.692,0.5,0.846,0.122,0.052,0.188
9
- Chronos-2,TiRex,0.808,0.654,0.962,0.143,0.076,0.204
10
- Chronos-2,TabPFN-TS,0.846,0.692,0.962,0.105,0.046,0.172
11
- Chronos-2,TimesFM-2.5,0.808,0.654,0.962,0.159,0.086,0.224
12
- Chronos-2,FlowState,0.846,0.692,0.962,0.166,0.098,0.224
13
- Chronos-2,Chronos-Bolt,0.962,0.885,1.0,0.165,0.099,0.23
14
- Chronos-2,Moirai-2.0,0.923,0.808,1.0,0.175,0.108,0.243
15
- Chronos-2,Toto-1.0,0.885,0.769,1.0,0.186,0.119,0.252
16
- Chronos-2,Toto-2.0-4m,0.962,0.885,1.0,0.183,0.114,0.247
17
- Chronos-2,Seasonal Naive,1.0,1.0,1.0,0.46,0.384,0.522
18
- Toto-2.0-1B,Chronos-2,0.5,0.308,0.692,-0.093,-0.19,-0.012
19
- Toto-2.0-1B,Toto-2.0-1B,0.5,0.5,0.5,0.0,0.0,0.0
20
- Toto-2.0-1B,Toto-2.0-2.5B,0.654,0.462,0.808,0.012,-0.002,0.029
21
- Toto-2.0-1B,Toto-2.0-313m,0.5,0.308,0.692,0.009,-0.011,0.036
22
- Toto-2.0-1B,TiRex-2,0.577,0.385,0.769,-0.044,-0.148,0.041
23
- Toto-2.0-1B,TabPFN-TS-3,0.5,0.308,0.692,-0.038,-0.155,0.074
24
- Toto-2.0-1B,Toto-2.0-22m,0.885,0.731,1.0,0.04,0.019,0.065
25
- Toto-2.0-1B,TiRex,0.731,0.577,0.885,0.063,0.022,0.115
26
- Toto-2.0-1B,TabPFN-TS,0.654,0.462,0.808,0.022,-0.085,0.112
27
- Toto-2.0-1B,TimesFM-2.5,0.846,0.692,0.962,0.081,0.037,0.131
28
- Toto-2.0-1B,FlowState,0.808,0.654,0.962,0.088,0.047,0.131
29
- Toto-2.0-1B,Chronos-Bolt,0.923,0.808,1.0,0.087,0.036,0.138
30
- Toto-2.0-1B,Moirai-2.0,0.846,0.692,0.962,0.098,0.054,0.147
31
- Toto-2.0-1B,Toto-1.0,0.962,0.885,1.0,0.11,0.074,0.153
32
- Toto-2.0-1B,Toto-2.0-4m,0.962,0.885,1.0,0.107,0.065,0.155
33
- Toto-2.0-1B,Seasonal Naive,1.0,1.0,1.0,0.41,0.333,0.481
34
- Toto-2.0-2.5B,Chronos-2,0.423,0.231,0.615,-0.106,-0.196,-0.025
35
- Toto-2.0-2.5B,Toto-2.0-1B,0.346,0.192,0.538,-0.012,-0.03,0.002
36
- Toto-2.0-2.5B,Toto-2.0-2.5B,0.5,0.5,0.5,0.0,0.0,0.0
37
- Toto-2.0-2.5B,Toto-2.0-313m,0.615,0.423,0.769,-0.003,-0.018,0.012
38
- Toto-2.0-2.5B,TiRex-2,0.538,0.346,0.731,-0.056,-0.158,0.027
39
- Toto-2.0-2.5B,TabPFN-TS-3,0.5,0.308,0.692,-0.05,-0.161,0.059
40
- Toto-2.0-2.5B,Toto-2.0-22m,0.769,0.615,0.923,0.028,0.011,0.045
41
- Toto-2.0-2.5B,TiRex,0.769,0.615,0.923,0.051,0.016,0.092
42
- Toto-2.0-2.5B,TabPFN-TS,0.692,0.538,0.846,0.01,-0.093,0.098
43
- Toto-2.0-2.5B,TimesFM-2.5,0.769,0.615,0.923,0.07,0.031,0.118
44
- Toto-2.0-2.5B,FlowState,0.846,0.692,0.962,0.077,0.036,0.12
45
- Toto-2.0-2.5B,Chronos-Bolt,0.846,0.692,0.962,0.076,0.031,0.122
46
- Toto-2.0-2.5B,Moirai-2.0,0.808,0.654,0.923,0.087,0.046,0.133
47
- Toto-2.0-2.5B,Toto-1.0,0.923,0.808,1.0,0.099,0.067,0.137
48
- Toto-2.0-2.5B,Toto-2.0-4m,0.846,0.692,0.962,0.096,0.057,0.137
49
- Toto-2.0-2.5B,Seasonal Naive,1.0,1.0,1.0,0.403,0.329,0.473
50
- Toto-2.0-313m,Chronos-2,0.462,0.269,0.654,-0.103,-0.196,-0.022
51
- Toto-2.0-313m,Toto-2.0-1B,0.5,0.308,0.692,-0.009,-0.037,0.011
52
- Toto-2.0-313m,Toto-2.0-2.5B,0.385,0.231,0.577,0.003,-0.012,0.018
53
- Toto-2.0-313m,Toto-2.0-313m,0.5,0.5,0.5,0.0,0.0,0.0
54
- Toto-2.0-313m,TiRex-2,0.538,0.346,0.731,-0.053,-0.156,0.03
55
- Toto-2.0-313m,TabPFN-TS-3,0.5,0.308,0.692,-0.047,-0.16,0.066
56
- Toto-2.0-313m,Toto-2.0-22m,0.846,0.692,0.962,0.031,0.014,0.049
57
- Toto-2.0-313m,TiRex,0.769,0.615,0.923,0.054,0.021,0.09
58
- Toto-2.0-313m,TabPFN-TS,0.654,0.462,0.846,0.013,-0.097,0.104
59
- Toto-2.0-313m,TimesFM-2.5,0.769,0.615,0.923,0.073,0.032,0.121
60
- Toto-2.0-313m,FlowState,0.808,0.654,0.962,0.08,0.042,0.122
61
- Toto-2.0-313m,Chronos-Bolt,0.846,0.692,0.962,0.079,0.033,0.131
62
- Toto-2.0-313m,Moirai-2.0,0.808,0.654,0.924,0.09,0.047,0.134
63
- Toto-2.0-313m,Toto-1.0,0.885,0.769,1.0,0.102,0.071,0.134
64
- Toto-2.0-313m,Toto-2.0-4m,0.923,0.808,1.0,0.099,0.061,0.139
65
- Toto-2.0-313m,Seasonal Naive,1.0,1.0,1.0,0.404,0.333,0.471
66
- TiRex-2,Chronos-2,0.423,0.231,0.615,-0.047,-0.104,0.001
67
- TiRex-2,Toto-2.0-1B,0.423,0.231,0.615,0.042,-0.043,0.129
68
- TiRex-2,Toto-2.0-2.5B,0.462,0.269,0.654,0.053,-0.028,0.137
69
- TiRex-2,Toto-2.0-313m,0.462,0.269,0.654,0.05,-0.031,0.135
70
- TiRex-2,TiRex-2,0.5,0.5,0.5,0.0,0.0,0.0
71
- TiRex-2,TabPFN-TS-3,0.5,0.308,0.692,0.006,-0.078,0.082
72
- TiRex-2,Toto-2.0-22m,0.5,0.308,0.692,0.08,0.002,0.161
73
- TiRex-2,TiRex,0.615,0.423,0.808,0.102,0.031,0.173
74
- TiRex-2,TabPFN-TS,0.615,0.423,0.808,0.063,-0.006,0.135
75
- TiRex-2,TimesFM-2.5,0.731,0.538,0.885,0.12,0.044,0.196
76
- TiRex-2,FlowState,0.808,0.654,0.923,0.126,0.052,0.194
77
- TiRex-2,Chronos-Bolt,0.808,0.654,0.962,0.125,0.045,0.209
78
- TiRex-2,Moirai-2.0,0.808,0.654,0.962,0.136,0.067,0.203
79
- TiRex-2,Toto-1.0,0.769,0.615,0.923,0.147,0.069,0.224
80
- TiRex-2,Toto-2.0-4m,0.846,0.692,0.962,0.144,0.068,0.221
81
- TiRex-2,Seasonal Naive,1.0,1.0,1.0,0.434,0.355,0.506
82
- TabPFN-TS-3,Chronos-2,0.308,0.154,0.5,-0.053,-0.119,0.003
83
- TabPFN-TS-3,Toto-2.0-1B,0.5,0.308,0.692,0.036,-0.08,0.134
84
- TabPFN-TS-3,Toto-2.0-2.5B,0.5,0.308,0.692,0.048,-0.063,0.139
85
- TabPFN-TS-3,Toto-2.0-313m,0.5,0.308,0.692,0.045,-0.071,0.138
86
- TabPFN-TS-3,TiRex-2,0.5,0.308,0.692,-0.006,-0.089,0.073
87
- TabPFN-TS-3,TabPFN-TS-3,0.5,0.5,0.5,0.0,0.0,0.0
88
- TabPFN-TS-3,Toto-2.0-22m,0.577,0.385,0.769,0.075,-0.031,0.163
89
- TabPFN-TS-3,TiRex,0.538,0.346,0.731,0.097,-0.002,0.184
90
- TabPFN-TS-3,TabPFN-TS,0.769,0.615,0.923,0.057,-0.009,0.113
91
- TabPFN-TS-3,TimesFM-2.5,0.615,0.423,0.808,0.114,0.023,0.198
92
- TabPFN-TS-3,FlowState,0.731,0.538,0.885,0.121,0.019,0.206
93
- TabPFN-TS-3,Chronos-Bolt,0.731,0.577,0.885,0.12,0.034,0.196
94
- TabPFN-TS-3,Moirai-2.0,0.654,0.462,0.846,0.131,0.027,0.222
95
- TabPFN-TS-3,Toto-1.0,0.654,0.462,0.808,0.142,0.045,0.231
96
- TabPFN-TS-3,Toto-2.0-4m,0.692,0.5,0.846,0.139,0.049,0.221
97
- TabPFN-TS-3,Seasonal Naive,1.0,1.0,1.0,0.431,0.357,0.498
98
- Toto-2.0-22m,Chronos-2,0.308,0.154,0.5,-0.139,-0.231,-0.055
99
- Toto-2.0-22m,Toto-2.0-1B,0.115,0.0,0.269,-0.042,-0.07,-0.019
100
- Toto-2.0-22m,Toto-2.0-2.5B,0.231,0.077,0.385,-0.029,-0.047,-0.011
101
- Toto-2.0-22m,Toto-2.0-313m,0.154,0.038,0.308,-0.032,-0.052,-0.014
102
- Toto-2.0-22m,TiRex-2,0.5,0.308,0.692,-0.087,-0.192,-0.002
103
- Toto-2.0-22m,TabPFN-TS-3,0.423,0.231,0.615,-0.081,-0.195,0.03
104
- Toto-2.0-22m,Toto-2.0-22m,0.5,0.5,0.5,0.0,0.0,0.0
105
- Toto-2.0-22m,TiRex,0.5,0.308,0.692,0.024,-0.012,0.064
106
- Toto-2.0-22m,TabPFN-TS,0.5,0.308,0.692,-0.019,-0.126,0.073
107
- Toto-2.0-22m,TimesFM-2.5,0.654,0.462,0.846,0.043,0.0,0.09
108
- Toto-2.0-22m,FlowState,0.769,0.615,0.923,0.05,0.007,0.089
109
- Toto-2.0-22m,Chronos-Bolt,0.769,0.615,0.923,0.049,0.002,0.098
110
- Toto-2.0-22m,Moirai-2.0,0.731,0.538,0.885,0.061,0.018,0.104
111
- Toto-2.0-22m,Toto-1.0,0.846,0.692,0.962,0.073,0.047,0.104
112
- Toto-2.0-22m,Toto-2.0-4m,0.808,0.654,0.962,0.069,0.038,0.103
113
- Toto-2.0-22m,Seasonal Naive,1.0,1.0,1.0,0.385,0.315,0.453
114
- TiRex,Chronos-2,0.192,0.038,0.346,-0.166,-0.256,-0.083
115
- TiRex,Toto-2.0-1B,0.269,0.115,0.423,-0.067,-0.129,-0.023
116
- TiRex,Toto-2.0-2.5B,0.231,0.077,0.385,-0.054,-0.102,-0.016
117
- TiRex,Toto-2.0-313m,0.231,0.077,0.385,-0.057,-0.099,-0.021
118
- TiRex,TiRex-2,0.385,0.192,0.577,-0.113,-0.209,-0.032
119
- TiRex,TabPFN-TS-3,0.462,0.269,0.654,-0.107,-0.225,0.002
120
- TiRex,Toto-2.0-22m,0.5,0.308,0.692,-0.024,-0.068,0.012
121
- TiRex,TiRex,0.5,0.5,0.5,0.0,0.0,0.0
122
- TiRex,TabPFN-TS,0.5,0.308,0.692,-0.043,-0.153,0.057
123
- TiRex,TimesFM-2.5,0.673,0.5,0.846,0.02,-0.015,0.053
124
- TiRex,FlowState,0.596,0.404,0.769,0.027,-0.013,0.066
125
- TiRex,Chronos-Bolt,0.712,0.538,0.865,0.026,-0.018,0.077
126
- TiRex,Moirai-2.0,0.75,0.577,0.904,0.038,0.007,0.071
127
- TiRex,Toto-1.0,0.788,0.635,0.942,0.05,0.022,0.081
128
- TiRex,Toto-2.0-4m,0.769,0.614,0.923,0.047,0.012,0.079
129
- TiRex,Seasonal Naive,1.0,1.0,1.0,0.37,0.299,0.439
130
- TabPFN-TS,Chronos-2,0.154,0.038,0.308,-0.118,-0.207,-0.048
131
- TabPFN-TS,Toto-2.0-1B,0.346,0.192,0.538,-0.022,-0.126,0.078
132
- TabPFN-TS,Toto-2.0-2.5B,0.308,0.154,0.462,-0.01,-0.109,0.085
133
- TabPFN-TS,Toto-2.0-313m,0.346,0.154,0.538,-0.013,-0.116,0.088
134
- TabPFN-TS,TiRex-2,0.385,0.192,0.577,-0.067,-0.156,0.006
135
- TabPFN-TS,TabPFN-TS-3,0.231,0.077,0.385,-0.061,-0.128,0.009
136
- TabPFN-TS,Toto-2.0-22m,0.5,0.308,0.692,0.018,-0.078,0.112
137
- TabPFN-TS,TiRex,0.5,0.308,0.692,0.042,-0.06,0.132
138
- TabPFN-TS,TabPFN-TS,0.5,0.5,0.5,0.0,0.0,0.0
139
- TabPFN-TS,TimesFM-2.5,0.538,0.346,0.731,0.061,-0.032,0.147
140
- TabPFN-TS,FlowState,0.577,0.385,0.769,0.068,-0.037,0.15
141
- TabPFN-TS,Chronos-Bolt,0.577,0.385,0.769,0.066,-0.013,0.144
142
- TabPFN-TS,Moirai-2.0,0.615,0.423,0.808,0.078,-0.027,0.177
143
- TabPFN-TS,Toto-1.0,0.577,0.385,0.769,0.09,-0.012,0.186
144
- TabPFN-TS,Toto-2.0-4m,0.615,0.423,0.808,0.087,-0.017,0.179
145
- TabPFN-TS,Seasonal Naive,1.0,1.0,1.0,0.396,0.322,0.469
146
- TimesFM-2.5,Chronos-2,0.192,0.038,0.346,-0.19,-0.289,-0.094
147
- TimesFM-2.5,Toto-2.0-1B,0.154,0.038,0.308,-0.088,-0.15,-0.039
148
- TimesFM-2.5,Toto-2.0-2.5B,0.231,0.077,0.385,-0.075,-0.134,-0.032
149
- TimesFM-2.5,Toto-2.0-313m,0.231,0.077,0.385,-0.079,-0.137,-0.033
150
- TimesFM-2.5,TiRex-2,0.269,0.115,0.462,-0.136,-0.244,-0.046
151
- TimesFM-2.5,TabPFN-TS-3,0.385,0.192,0.577,-0.129,-0.247,-0.023
152
- TimesFM-2.5,Toto-2.0-22m,0.346,0.154,0.538,-0.045,-0.098,-0.0
153
- TimesFM-2.5,TiRex,0.327,0.154,0.5,-0.02,-0.056,0.015
154
- TimesFM-2.5,TabPFN-TS,0.462,0.269,0.654,-0.064,-0.172,0.031
155
- TimesFM-2.5,TimesFM-2.5,0.5,0.5,0.5,0.0,0.0,0.0
156
- TimesFM-2.5,FlowState,0.538,0.365,0.712,0.008,-0.042,0.052
157
- TimesFM-2.5,Chronos-Bolt,0.577,0.404,0.75,0.006,-0.031,0.046
158
- TimesFM-2.5,Moirai-2.0,0.615,0.442,0.788,0.018,-0.038,0.072
159
- TimesFM-2.5,Toto-1.0,0.654,0.481,0.808,0.031,-0.017,0.08
160
- TimesFM-2.5,Toto-2.0-4m,0.615,0.423,0.808,0.028,-0.014,0.068
161
- TimesFM-2.5,Seasonal Naive,1.0,1.0,1.0,0.357,0.288,0.423
162
- FlowState,Chronos-2,0.154,0.038,0.308,-0.199,-0.288,-0.109
163
- FlowState,Toto-2.0-1B,0.192,0.038,0.346,-0.097,-0.151,-0.049
164
- FlowState,Toto-2.0-2.5B,0.154,0.038,0.308,-0.084,-0.136,-0.038
165
- FlowState,Toto-2.0-313m,0.192,0.038,0.346,-0.087,-0.139,-0.043
166
- FlowState,TiRex-2,0.192,0.077,0.346,-0.145,-0.241,-0.055
167
- FlowState,TabPFN-TS-3,0.269,0.115,0.462,-0.138,-0.259,-0.02
168
- FlowState,Toto-2.0-22m,0.231,0.077,0.385,-0.053,-0.098,-0.007
169
- FlowState,TiRex,0.404,0.231,0.596,-0.028,-0.071,0.013
170
- FlowState,TabPFN-TS,0.423,0.231,0.615,-0.073,-0.177,0.036
171
- FlowState,TimesFM-2.5,0.462,0.288,0.635,-0.008,-0.055,0.04
172
- FlowState,FlowState,0.5,0.5,0.5,0.0,0.0,0.0
173
- FlowState,Chronos-Bolt,0.5,0.326,0.674,-0.002,-0.052,0.067
174
- FlowState,Moirai-2.0,0.538,0.365,0.712,0.011,-0.039,0.061
175
- FlowState,Toto-1.0,0.462,0.288,0.635,0.023,-0.024,0.072
176
- FlowState,Toto-2.0-4m,0.538,0.346,0.731,0.02,-0.033,0.065
177
- FlowState,Seasonal Naive,0.923,0.808,1.0,0.352,0.275,0.427
178
- Chronos-Bolt,Chronos-2,0.038,0.0,0.115,-0.197,-0.299,-0.11
179
- Chronos-Bolt,Toto-2.0-1B,0.077,0.0,0.192,-0.095,-0.16,-0.038
180
- Chronos-Bolt,Toto-2.0-2.5B,0.154,0.038,0.308,-0.082,-0.139,-0.032
181
- Chronos-Bolt,Toto-2.0-313m,0.154,0.038,0.308,-0.085,-0.15,-0.035
182
- Chronos-Bolt,TiRex-2,0.192,0.038,0.346,-0.143,-0.264,-0.047
183
- Chronos-Bolt,TabPFN-TS-3,0.269,0.115,0.423,-0.136,-0.244,-0.035
184
- Chronos-Bolt,Toto-2.0-22m,0.231,0.077,0.385,-0.051,-0.108,-0.002
185
- Chronos-Bolt,TiRex,0.288,0.135,0.462,-0.027,-0.084,0.018
186
- Chronos-Bolt,TabPFN-TS,0.423,0.231,0.615,-0.071,-0.168,0.013
187
- Chronos-Bolt,TimesFM-2.5,0.423,0.25,0.596,-0.006,-0.048,0.03
188
- Chronos-Bolt,FlowState,0.5,0.326,0.674,0.002,-0.072,0.05
189
- Chronos-Bolt,Chronos-Bolt,0.5,0.5,0.5,0.0,0.0,0.0
190
- Chronos-Bolt,Moirai-2.0,0.462,0.308,0.635,0.012,-0.062,0.076
191
- Chronos-Bolt,Toto-1.0,0.615,0.442,0.769,0.025,-0.03,0.078
192
- Chronos-Bolt,Toto-2.0-4m,0.615,0.423,0.77,0.022,-0.038,0.07
193
- Chronos-Bolt,Seasonal Naive,1.0,1.0,1.0,0.353,0.287,0.417
194
- Moirai-2.0,Chronos-2,0.077,0.0,0.192,-0.212,-0.32,-0.122
195
- Moirai-2.0,Toto-2.0-1B,0.154,0.038,0.308,-0.109,-0.173,-0.057
196
- Moirai-2.0,Toto-2.0-2.5B,0.192,0.077,0.346,-0.096,-0.154,-0.048
197
- Moirai-2.0,Toto-2.0-313m,0.192,0.076,0.346,-0.099,-0.154,-0.05
198
- Moirai-2.0,TiRex-2,0.192,0.038,0.346,-0.157,-0.255,-0.072
199
- Moirai-2.0,TabPFN-TS-3,0.346,0.154,0.538,-0.151,-0.285,-0.028
200
- Moirai-2.0,Toto-2.0-22m,0.269,0.115,0.462,-0.064,-0.116,-0.018
201
- Moirai-2.0,TiRex,0.25,0.096,0.423,-0.039,-0.077,-0.007
202
- Moirai-2.0,TabPFN-TS,0.385,0.192,0.577,-0.084,-0.216,0.026
203
- Moirai-2.0,TimesFM-2.5,0.385,0.212,0.558,-0.019,-0.077,0.037
204
- Moirai-2.0,FlowState,0.462,0.288,0.635,-0.011,-0.066,0.037
205
- Moirai-2.0,Chronos-Bolt,0.538,0.365,0.692,-0.012,-0.082,0.058
206
- Moirai-2.0,Moirai-2.0,0.5,0.5,0.5,0.0,0.0,0.0
207
- Moirai-2.0,Toto-1.0,0.538,0.365,0.712,0.013,-0.016,0.045
208
- Moirai-2.0,Toto-2.0-4m,0.538,0.346,0.731,0.009,-0.03,0.051
209
- Moirai-2.0,Seasonal Naive,0.923,0.808,1.0,0.345,0.266,0.421
210
- Toto-1.0,Chronos-2,0.115,0.0,0.231,-0.228,-0.337,-0.135
211
- Toto-1.0,Toto-2.0-1B,0.038,0.0,0.115,-0.123,-0.18,-0.08
212
- Toto-1.0,Toto-2.0-2.5B,0.077,0.0,0.192,-0.11,-0.158,-0.072
213
- Toto-1.0,Toto-2.0-313m,0.115,0.0,0.231,-0.113,-0.155,-0.077
214
- Toto-1.0,TiRex-2,0.231,0.077,0.385,-0.172,-0.289,-0.074
215
- Toto-1.0,TabPFN-TS-3,0.346,0.192,0.538,-0.166,-0.3,-0.047
216
- Toto-1.0,Toto-2.0-22m,0.154,0.038,0.308,-0.078,-0.117,-0.049
217
- Toto-1.0,TiRex,0.212,0.058,0.365,-0.053,-0.088,-0.023
218
- Toto-1.0,TabPFN-TS,0.423,0.231,0.615,-0.099,-0.228,0.012
219
- Toto-1.0,TimesFM-2.5,0.346,0.192,0.519,-0.032,-0.087,0.017
220
- Toto-1.0,FlowState,0.538,0.365,0.712,-0.024,-0.078,0.023
221
- Toto-1.0,Chronos-Bolt,0.385,0.231,0.558,-0.026,-0.085,0.029
222
- Toto-1.0,Moirai-2.0,0.462,0.288,0.635,-0.013,-0.047,0.016
223
- Toto-1.0,Toto-1.0,0.5,0.5,0.5,0.0,0.0,0.0
224
- Toto-1.0,Toto-2.0-4m,0.577,0.385,0.731,-0.004,-0.04,0.026
225
- Toto-1.0,Seasonal Naive,0.962,0.885,1.0,0.337,0.259,0.412
226
- Toto-2.0-4m,Chronos-2,0.038,0.0,0.115,-0.224,-0.327,-0.128
227
- Toto-2.0-4m,Toto-2.0-1B,0.038,0.0,0.115,-0.119,-0.184,-0.069
228
- Toto-2.0-4m,Toto-2.0-2.5B,0.154,0.038,0.308,-0.106,-0.159,-0.06
229
- Toto-2.0-4m,Toto-2.0-313m,0.077,0.0,0.192,-0.109,-0.161,-0.065
230
- Toto-2.0-4m,TiRex-2,0.154,0.038,0.308,-0.168,-0.283,-0.072
231
- Toto-2.0-4m,TabPFN-TS-3,0.308,0.154,0.5,-0.161,-0.283,-0.052
232
- Toto-2.0-4m,Toto-2.0-22m,0.192,0.038,0.346,-0.075,-0.115,-0.039
233
- Toto-2.0-4m,TiRex,0.231,0.077,0.386,-0.049,-0.086,-0.012
234
- Toto-2.0-4m,TabPFN-TS,0.385,0.192,0.577,-0.095,-0.218,0.017
235
- Toto-2.0-4m,TimesFM-2.5,0.385,0.192,0.577,-0.028,-0.073,0.014
236
- Toto-2.0-4m,FlowState,0.462,0.269,0.654,-0.02,-0.07,0.032
237
- Toto-2.0-4m,Chronos-Bolt,0.385,0.23,0.577,-0.022,-0.075,0.036
238
- Toto-2.0-4m,Moirai-2.0,0.462,0.269,0.654,-0.01,-0.053,0.029
239
- Toto-2.0-4m,Toto-1.0,0.423,0.269,0.615,0.004,-0.027,0.038
240
- Toto-2.0-4m,Toto-2.0-4m,0.5,0.5,0.5,0.0,0.0,0.0
241
- Toto-2.0-4m,Seasonal Naive,1.0,1.0,1.0,0.339,0.27,0.408
242
- Seasonal Naive,Chronos-2,0.0,0.0,0.0,-0.852,-1.093,-0.622
243
- Seasonal Naive,Toto-2.0-1B,0.0,0.0,0.0,-0.694,-0.927,-0.5
244
- Seasonal Naive,Toto-2.0-2.5B,0.0,0.0,0.0,-0.674,-0.899,-0.491
245
- Seasonal Naive,Toto-2.0-313m,0.0,0.0,0.0,-0.679,-0.891,-0.5
246
- Seasonal Naive,TiRex-2,0.0,0.0,0.0,-0.768,-1.023,-0.55
247
- Seasonal Naive,TabPFN-TS-3,0.0,0.0,0.0,-0.758,-0.992,-0.556
248
- Seasonal Naive,Toto-2.0-22m,0.0,0.0,0.0,-0.626,-0.83,-0.46
249
- Seasonal Naive,TiRex,0.0,0.0,0.0,-0.588,-0.782,-0.427
250
- Seasonal Naive,TabPFN-TS,0.0,0.0,0.0,-0.657,-0.882,-0.476
251
- Seasonal Naive,TimesFM-2.5,0.0,0.0,0.0,-0.556,-0.734,-0.404
252
- Seasonal Naive,FlowState,0.077,0.0,0.192,-0.544,-0.745,-0.38
253
- Seasonal Naive,Chronos-Bolt,0.0,0.0,0.0,-0.547,-0.716,-0.403
254
- Seasonal Naive,Moirai-2.0,0.077,0.0,0.192,-0.528,-0.727,-0.362
255
- Seasonal Naive,Toto-1.0,0.038,0.0,0.115,-0.508,-0.7,-0.35
256
- Seasonal Naive,Toto-2.0-4m,0.0,0.0,0.0,-0.513,-0.688,-0.369
257
- Seasonal Naive,Seasonal Naive,0.5,0.5,0.5,0.0,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_health/leaderboard_MASE.csv DELETED
@@ -1,29 +0,0 @@
1
- model_name,win_rate,skill_score,median_training_time_s_per100,median_inference_time_s_per100,training_corpus_overlap,num_failures
2
- TiRex-2,80.37037037037038,34.9166343514373,0.0,0.3575023838736039,0.0,0.0
3
- TimesFM-2.5,70.37037037037038,32.87474894024488,0.0,1.1256479395833334,0.0,0.0
4
- Chronos-2,68.88888888888891,31.78597649489514,0.0,0.3492251116666667,0.0,0.0
5
- TabPFN-TS-3,68.51851851851852,28.963255047296542,0.0,199.6776895770319,0.0,0.0
6
- TabPFN-TS,66.66666666666666,34.55373879766452,0.0,53.951610824166664,0.0,0.0
7
- TiRex,65.18518518518519,32.47588770643868,0.0,0.330588668125,0.0,0.0
8
- FlowState,63.33333333333334,27.93729353213241,0.0,1.679734656979167,0.0,0.0
9
- LightGBM,62.96296296296296,33.38915880315173,1.2161332720833333,0.19742606979166666,0.0,0.0
10
- CatBoost,62.22222222222222,33.16623383500657,13.210264008932292,0.19426541770833333,0.0,0.0
11
- Moirai-2.0,62.03703703703704,33.79488506711863,0.0,0.3505868739583333,0.1,0.0
12
- Toto-2.0-313m,60.74074074074075,27.130941962281884,0.0,1.1242909435416668,0.0,0.0
13
- Toto-2.0-2.5B,60.74074074074075,27.02155839964281,0.0,5.925324101666666,0.0,0.0
14
- Toto-2.0-1B,56.666666666666664,26.055688762834595,0.0,2.728815209166667,0.0,0.0
15
- Toto-2.0-22m,56.2962962962963,27.354995059689568,0.0,0.4238227016666667,0.0,0.0
16
- Toto-1.0,55.18518518518518,31.700573837170467,0.0,9.804296426666667,0.0,0.0
17
- Chronos-Bolt,54.629629629629626,30.041136052707273,0.0,0.41178704374999997,0.0,0.0
18
- Toto-2.0-4m,54.07407407407408,28.997499277709025,0.0,0.36290417583333334,0.0,0.0
19
- AutoETS,48.14814814814816,28.071655328734924,0.0,2.5273205354166666,0.0,0.0
20
- Stat. Ensemble,48.148148148148145,29.22979017092695,0.0,191.30953815208332,0.0,0.0
21
- Sundial-Base,44.81481481481482,22.70787609837541,0.0,8.29280267,0.0,0.0
22
- AutoARIMA,32.59259259259259,5.881738752268506,0.0,7.6933014760416665,0.0,0.0
23
- TFT,28.888888888888886,8.056299346355855,577.3621929408333,0.91290832015625,0.0,0.0
24
- AutoTheta,26.666666666666668,15.20916710141943,0.0,2.3246237520833333,0.0,0.0
25
- DeepAR,23.333333333333336,8.848833829469338,1252.3585836206248,0.9790481578125001,0.0,0.0
26
- PatchTST,22.592592592592585,12.927869318522445,812.3820815818749,0.4485787422916667,0.0,0.0
27
- Seasonal Naive,20.185185185185187,0.0,0.0,1.2681127877083334,0.0,0.0
28
- Naive,17.962962962962962,0.30982947391161586,0.0,1.2969351423177082,0.0,0.0
29
- Drift,17.77777777777778,7.491051482058886,0.0,1.3917920932291667,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_health/leaderboard_SQL.csv DELETED
@@ -1,29 +0,0 @@
1
- model_name,win_rate,skill_score,median_training_time_s_per100,median_inference_time_s_per100,training_corpus_overlap,num_failures
2
- TiRex-2,84.44444444444444,39.425727939082535,0.0,0.3575023838736039,0.0,0.0
3
- Chronos-2,78.51851851851852,38.08875531260849,0.0,0.3492251116666667,0.0,0.0
4
- TimesFM-2.5,73.33333333333336,38.03594071146331,0.0,1.1256479395833334,0.0,0.0
5
- Toto-2.0-313m,68.51851851851852,33.76977925435224,0.0,1.1242909435416668,0.0,0.0
6
- Moirai-2.0,67.5925925925926,38.69101646514035,0.0,0.3505868739583333,0.1,0.0
7
- TabPFN-TS,66.66666666666666,37.79500412291329,0.0,53.951610824166664,0.0,0.0
8
- Toto-2.0-2.5B,65.92592592592594,33.54660585794915,0.0,5.925324101666666,0.0,0.0
9
- TiRex,65.55555555555556,36.908809542631595,0.0,0.330588668125,0.0,0.0
10
- TabPFN-TS-3,64.81481481481482,33.86938070997042,0.0,199.6776895770319,0.0,0.0
11
- Toto-1.0,63.703703703703695,37.78506660666954,0.0,9.804296426666667,0.0,0.0
12
- Toto-2.0-1B,62.5925925925926,32.77732666419397,0.0,2.728815209166667,0.0,0.0
13
- Toto-2.0-22m,62.22222222222222,33.710262442699914,0.0,0.4238227016666667,0.0,0.0
14
- Chronos-Bolt,61.66666666666666,36.49963478571547,0.0,0.41178704374999997,0.0,0.0
15
- FlowState,57.03703703703704,32.77403706037661,0.0,1.679734656979167,0.0,0.0
16
- Toto-2.0-4m,55.18518518518518,34.41096517434523,0.0,0.36290417583333334,0.0,0.0
17
- AutoETS,52.22222222222223,31.12404358258436,0.0,2.5273205354166666,0.0,0.0
18
- Stat. Ensemble,46.666666666666664,31.666899122864876,0.0,191.30953815208332,0.0,0.0
19
- LightGBM,41.851851851851855,24.996902028028057,1.2161332720833333,0.19742606979166666,0.0,0.0
20
- CatBoost,37.77777777777778,24.745890887412404,13.210264008932292,0.19426541770833333,0.0,0.0
21
- Sundial-Base,36.29629629629629,23.555776042271713,0.0,8.29280267,0.0,0.0
22
- AutoARIMA,33.33333333333333,8.15543220497067,0.0,7.6933014760416665,0.0,0.0
23
- TFT,32.59259259259259,13.487049535026774,577.3621929408333,0.91290832015625,0.0,0.0
24
- PatchTST,25.925925925925924,17.70708962424181,812.3820815818749,0.4485787422916667,0.0,0.0
25
- AutoTheta,25.185185185185183,17.733419411019135,0.0,2.3246237520833333,0.0,0.0
26
- DeepAR,22.962962962962962,13.730380882991922,1252.3585836206248,0.9790481578125001,0.0,0.0
27
- Seasonal Naive,19.444444444444446,0.0,0.0,1.2681127877083334,0.0,0.0
28
- Naive,14.629629629629632,-7.297793646802875,0.0,1.2969351423177082,0.0,0.0
29
- Drift,13.333333333333334,0.404190086867684,0.0,1.3917920932291667,0.0,0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tables/domain_health/leaderboard_WAPE.csv DELETED
@@ -1,29 +0,0 @@
1
- model_name,win_rate,skill_score,median_training_time_s_per100,median_inference_time_s_per100,training_corpus_overlap,num_failures
2
- TimesFM-2.5,69.62962962962965,30.236433011588616,0.0,1.1256479395833334,0.0,0.0
3
- TiRex-2,68.14814814814817,26.601930748682324,0.0,0.3575023838736039,0.0,0.0
4
- TabPFN-TS-3,67.77777777777779,27.06736057976333,0.0,199.6776895770319,0.0,0.0
5
- Chronos-2,66.2962962962963,29.12048347898083,0.0,0.3492251116666667,0.0,0.0
6
- Toto-2.0-2.5B,64.07407407407408,23.803402469752132,0.0,5.925324101666666,0.0,0.0
7
- TiRex,63.70370370370372,29.759653720585042,0.0,0.330588668125,0.0,0.0
8
- FlowState,62.22222222222222,25.714346434991153,0.0,1.679734656979167,0.0,0.0
9
- Moirai-2.0,60.92592592592593,31.595921669939887,0.0,0.3505868739583333,0.1,0.0
10
- Toto-1.0,60.370370370370374,28.753205083598854,0.0,9.804296426666667,0.0,0.0
11
- Toto-2.0-313m,59.25925925925927,23.159110215973843,0.0,1.1242909435416668,0.0,0.0
12
- Toto-2.0-22m,58.51851851851851,23.737937635347716,0.0,0.4238227016666667,0.0,0.0
13
- Toto-2.0-1B,58.14814814814815,22.479955103457115,0.0,2.728815209166667,0.0,0.0
14
- TabPFN-TS,57.407407407407405,29.1761523445201,0.0,53.951610824166664,0.0,0.0
15
- AutoETS,56.666666666666664,29.45241897965094,0.0,2.5273205354166666,0.0,0.0
16
- Toto-2.0-4m,55.92592592592594,24.961571876693643,0.0,0.36290417583333334,0.0,0.0
17
- Stat. Ensemble,55.925925925925924,29.6956210738891,0.0,191.30953815208332,0.0,0.0
18
- LightGBM,54.81481481481482,28.23998648969035,1.2161332720833333,0.19742606979166666,0.0,0.0
19
- Chronos-Bolt,52.77777777777778,25.883263022341175,0.0,0.41178704374999997,0.0,0.0
20
- CatBoost,47.77777777777777,24.80079887494443,13.210264008932292,0.19426541770833333,0.0,0.0
21
- Sundial-Base,41.85185185185184,16.462366143379946,0.0,8.29280267,0.0,0.0
22
- AutoARIMA,36.66666666666667,15.90999185953288,0.0,7.6933014760416665,0.0,0.0
23
- AutoTheta,30.740740740740733,14.265515876146328,0.0,2.3246237520833333,0.0,0.0
24
- DeepAR,28.148148148148156,4.835755105983619,1252.3585836206248,0.9790481578125001,0.0,0.0
25
- Drift,26.296296296296294,6.995102476216641,0.0,1.3917920932291667,0.0,0.0
26
- TFT,24.814814814814813,-0.6246028567987283,577.3621929408333,0.91290832015625,0.0,0.0
27
- Seasonal Naive,24.629629629629633,0.0,0.0,1.2681127877083334,0.0,0.0
28
- Naive,24.629629629629626,0.09410405602899852,0.0,1.2969351423177082,0.0,0.0
29
- PatchTST,21.851851851851848,2.754946880183251,812.3820815818749,0.4485787422916667,0.0,0.0