Spaces:
Running
Running
Upload folder using huggingface_hub
Browse files- .gitattributes +4 -0
- logs/2026-02-02T13-00-41+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_co73hNPnAePTvVsHmdiZt2.eval +3 -0
- logs/2026-02-02T13-03-14+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_mSCwqPyiVswD6WnSEjVNs2.eval +0 -0
- logs/2026-02-02T13-03-50+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_J35BMrWXGQA8T5n3nHHS7r.eval +3 -0
- logs/2026-02-02T13-25-44+00-00_hf-MathArena-aime-2025@ff26345f99c0a065526ca90fb89aa1ced562afb2_ix43E76FRHBTA4JkxeQ99D.eval +3 -0
- logs/2026-02-02T13-34-36+00-00_hf-MathArena-aime-2025@15e7287ff47020aa7163d48aa34862ba37e696bc_LpJvgh3TnKFpozAPNyp2Cw.eval +0 -0
- logs/2026-02-02T13-36-53+00-00_hf-MathArena-aime-2025@17c5d1ce7e5adea29aa3149fa6f1d45e62f00fff_aevZyyQdUobSMb2RU3Lsg7.eval +0 -0
- logs/2026-02-02T13-39-34+00-00_hf-MathArena-aime-2025@17c5d1ce7e5adea29aa3149fa6f1d45e62f00fff_C2FpQhKxw35GYXP8oyKEc6.eval +3 -0
- logs/listing.json +116 -0
.gitattributes
CHANGED
|
@@ -42,3 +42,7 @@ logs/2026-01-29T10-56-48+00-00_hf-MathArena-aime-2025@09a132a1496bd52de52ce3e9f5
|
|
| 42 |
logs/2026-01-30T12-25-52+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_Gz7jkifS4nV3Hp9wQEJZhR.eval filter=lfs diff=lfs merge=lfs -text
|
| 43 |
logs/2026-01-30T12-32-34+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_dNKnXHqqpsCfEkbaoYRfXy.eval filter=lfs diff=lfs merge=lfs -text
|
| 44 |
logs/2026-01-30T12-35-53+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_UbXsSjiS7fFKnFgCqWtycz.eval filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 42 |
logs/2026-01-30T12-25-52+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_Gz7jkifS4nV3Hp9wQEJZhR.eval filter=lfs diff=lfs merge=lfs -text
|
| 43 |
logs/2026-01-30T12-32-34+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_dNKnXHqqpsCfEkbaoYRfXy.eval filter=lfs diff=lfs merge=lfs -text
|
| 44 |
logs/2026-01-30T12-35-53+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_UbXsSjiS7fFKnFgCqWtycz.eval filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
logs/2026-02-02T13-00-41+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_co73hNPnAePTvVsHmdiZt2.eval filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
logs/2026-02-02T13-03-50+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_J35BMrWXGQA8T5n3nHHS7r.eval filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
logs/2026-02-02T13-25-44+00-00_hf-MathArena-aime-2025@ff26345f99c0a065526ca90fb89aa1ced562afb2_ix43E76FRHBTA4JkxeQ99D.eval filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
logs/2026-02-02T13-39-34+00-00_hf-MathArena-aime-2025@17c5d1ce7e5adea29aa3149fa6f1d45e62f00fff_C2FpQhKxw35GYXP8oyKEc6.eval filter=lfs diff=lfs merge=lfs -text
|
logs/2026-02-02T13-00-41+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_co73hNPnAePTvVsHmdiZt2.eval
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d9b2c957156349dd5f9d36105dfe17633a7b99c5bfc3a5c3e90c0f10878ff6e5
|
| 3 |
+
size 261083
|
logs/2026-02-02T13-03-14+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_mSCwqPyiVswD6WnSEjVNs2.eval
ADDED
|
Binary file (2.18 kB). View file
|
|
|
logs/2026-02-02T13-03-50+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_J35BMrWXGQA8T5n3nHHS7r.eval
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eb894b84a49c9524f0b3b1ed644b9b5c9baad4e6329b60b52185661c225962a4
|
| 3 |
+
size 192319
|
logs/2026-02-02T13-25-44+00-00_hf-MathArena-aime-2025@ff26345f99c0a065526ca90fb89aa1ced562afb2_ix43E76FRHBTA4JkxeQ99D.eval
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a05c8816e1c379408822cebbab7e51bc3f9d44067c4e5e6cbe14a538275d1061
|
| 3 |
+
size 242019
|
logs/2026-02-02T13-34-36+00-00_hf-MathArena-aime-2025@15e7287ff47020aa7163d48aa34862ba37e696bc_LpJvgh3TnKFpozAPNyp2Cw.eval
ADDED
|
Binary file (19.3 kB). View file
|
|
|
logs/2026-02-02T13-36-53+00-00_hf-MathArena-aime-2025@17c5d1ce7e5adea29aa3149fa6f1d45e62f00fff_aevZyyQdUobSMb2RU3Lsg7.eval
ADDED
|
Binary file (21.6 kB). View file
|
|
|
logs/2026-02-02T13-39-34+00-00_hf-MathArena-aime-2025@17c5d1ce7e5adea29aa3149fa6f1d45e62f00fff_C2FpQhKxw35GYXP8oyKEc6.eval
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eb5adf6e1d85f1aea2ba6c853bf4a54b4249f2aeb4579c5e5293ed23a17a2b19
|
| 3 |
+
size 7460548
|
logs/listing.json
CHANGED
|
@@ -1,4 +1,120 @@
|
|
| 1 |
{
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
"2026-01-30T12-35-53+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_UbXsSjiS7fFKnFgCqWtycz.eval": {
|
| 3 |
"eval_id": "kum6GMmigXaMnU7EZkP8sM",
|
| 4 |
"run_id": "g84K6KqP73tPXxgCiWmt4M",
|
|
|
|
| 1 |
{
|
| 2 |
+
"2026-02-02T13-39-34+00-00_hf-MathArena-aime-2025@17c5d1ce7e5adea29aa3149fa6f1d45e62f00fff_C2FpQhKxw35GYXP8oyKEc6.eval": {
|
| 3 |
+
"eval_id": "Vqyg34jp4KsdctXr5uZ9VJ",
|
| 4 |
+
"run_id": "S4WiFt6XBqwrCRYXiSL5Es",
|
| 5 |
+
"task": "hf/MathArena/aime_2025@17c5d1ce7e5adea29aa3149fa6f1d45e62f00fff",
|
| 6 |
+
"task_id": "C2FpQhKxw35GYXP8oyKEc6",
|
| 7 |
+
"task_version": 0,
|
| 8 |
+
"version": 2,
|
| 9 |
+
"status": "success",
|
| 10 |
+
"invalidated": false,
|
| 11 |
+
"model": "openai/o4-mini",
|
| 12 |
+
"started_at": "2026-02-02T13:39:34+00:00",
|
| 13 |
+
"completed_at": "2026-02-02T13:54:48+00:00",
|
| 14 |
+
"primary_metric": {
|
| 15 |
+
"name": "accuracy",
|
| 16 |
+
"value": 0.8666666666666667,
|
| 17 |
+
"params": {}
|
| 18 |
+
}
|
| 19 |
+
},
|
| 20 |
+
"2026-02-02T13-36-53+00-00_hf-MathArena-aime-2025@17c5d1ce7e5adea29aa3149fa6f1d45e62f00fff_aevZyyQdUobSMb2RU3Lsg7.eval": {
|
| 21 |
+
"eval_id": "VTmCpkqBvLDmgBgkrD9uRr",
|
| 22 |
+
"run_id": "MPLHBoWnGoCM9DH5mAaG79",
|
| 23 |
+
"task": "hf/MathArena/aime_2025@17c5d1ce7e5adea29aa3149fa6f1d45e62f00fff",
|
| 24 |
+
"task_id": "aevZyyQdUobSMb2RU3Lsg7",
|
| 25 |
+
"task_version": 0,
|
| 26 |
+
"version": 2,
|
| 27 |
+
"status": "success",
|
| 28 |
+
"invalidated": false,
|
| 29 |
+
"model": "openai/o4-mini",
|
| 30 |
+
"started_at": "2026-02-02T13:36:53+00:00",
|
| 31 |
+
"completed_at": "2026-02-02T13:38:14+00:00",
|
| 32 |
+
"primary_metric": {
|
| 33 |
+
"name": "accuracy",
|
| 34 |
+
"value": 1.0,
|
| 35 |
+
"params": {}
|
| 36 |
+
}
|
| 37 |
+
},
|
| 38 |
+
"2026-02-02T13-34-36+00-00_hf-MathArena-aime-2025@15e7287ff47020aa7163d48aa34862ba37e696bc_LpJvgh3TnKFpozAPNyp2Cw.eval": {
|
| 39 |
+
"eval_id": "KEazAwxonijv8gKPjYPoNt",
|
| 40 |
+
"run_id": "VD2rYZbBxtsRK863F3Z8n5",
|
| 41 |
+
"task": "hf/MathArena/aime_2025@15e7287ff47020aa7163d48aa34862ba37e696bc",
|
| 42 |
+
"task_id": "LpJvgh3TnKFpozAPNyp2Cw",
|
| 43 |
+
"task_version": 0,
|
| 44 |
+
"version": 2,
|
| 45 |
+
"status": "success",
|
| 46 |
+
"invalidated": false,
|
| 47 |
+
"model": "openai/o4-mini",
|
| 48 |
+
"started_at": "2026-02-02T13:34:36+00:00",
|
| 49 |
+
"completed_at": "2026-02-02T13:35:28+00:00",
|
| 50 |
+
"primary_metric": {
|
| 51 |
+
"name": "accuracy",
|
| 52 |
+
"value": 1.0,
|
| 53 |
+
"params": {}
|
| 54 |
+
}
|
| 55 |
+
},
|
| 56 |
+
"2026-02-02T13-25-44+00-00_hf-MathArena-aime-2025@ff26345f99c0a065526ca90fb89aa1ced562afb2_ix43E76FRHBTA4JkxeQ99D.eval": {
|
| 57 |
+
"eval_id": "H8PxDxJe23ibiYyEZdmStS",
|
| 58 |
+
"run_id": "XsyPhsRd2jgbXkAWzqLStZ",
|
| 59 |
+
"task": "hf/MathArena/aime_2025@ff26345f99c0a065526ca90fb89aa1ced562afb2",
|
| 60 |
+
"task_id": "ix43E76FRHBTA4JkxeQ99D",
|
| 61 |
+
"task_version": 0,
|
| 62 |
+
"version": 2,
|
| 63 |
+
"status": "success",
|
| 64 |
+
"invalidated": false,
|
| 65 |
+
"model": "openai/o4-mini",
|
| 66 |
+
"started_at": "2026-02-02T13:25:44+00:00",
|
| 67 |
+
"completed_at": "2026-02-02T13:27:15+00:00",
|
| 68 |
+
"primary_metric": {
|
| 69 |
+
"name": "accuracy",
|
| 70 |
+
"value": 1.0,
|
| 71 |
+
"params": {}
|
| 72 |
+
}
|
| 73 |
+
},
|
| 74 |
+
"2026-02-02T13-03-50+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_J35BMrWXGQA8T5n3nHHS7r.eval": {
|
| 75 |
+
"eval_id": "Q89SzdgfGmWWbfhhsS6so7",
|
| 76 |
+
"run_id": "kEgN6gDgzV6isp8Mgy8RXY",
|
| 77 |
+
"task": "hf/MathArena/aime_2025@895d9df74faf7aa8dedb081a1dde6a258e594e33",
|
| 78 |
+
"task_id": "J35BMrWXGQA8T5n3nHHS7r",
|
| 79 |
+
"task_version": 0,
|
| 80 |
+
"version": 2,
|
| 81 |
+
"status": "success",
|
| 82 |
+
"invalidated": false,
|
| 83 |
+
"model": "openai/o4-mini",
|
| 84 |
+
"started_at": "2026-02-02T13:03:50+00:00",
|
| 85 |
+
"completed_at": "2026-02-02T13:05:05+00:00",
|
| 86 |
+
"primary_metric": {
|
| 87 |
+
"name": "accuracy",
|
| 88 |
+
"value": 1.0,
|
| 89 |
+
"params": {}
|
| 90 |
+
}
|
| 91 |
+
},
|
| 92 |
+
"2026-02-02T13-03-14+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_mSCwqPyiVswD6WnSEjVNs2.eval": {
|
| 93 |
+
"eval_id": "f6vyPkUpNgDTfKTraw87wJ",
|
| 94 |
+
"run_id": "i4J7MxMbY5Uzeq8yffigaa",
|
| 95 |
+
"task": "hf/MathArena/aime_2025@895d9df74faf7aa8dedb081a1dde6a258e594e33",
|
| 96 |
+
"task_id": "mSCwqPyiVswD6WnSEjVNs2",
|
| 97 |
+
"task_version": 0,
|
| 98 |
+
"version": 2,
|
| 99 |
+
"status": "cancelled",
|
| 100 |
+
"invalidated": false,
|
| 101 |
+
"model": "openai/o4-mini",
|
| 102 |
+
"started_at": "2026-02-02T13:03:14+00:00",
|
| 103 |
+
"completed_at": "2026-02-02T13:03:24+00:00"
|
| 104 |
+
},
|
| 105 |
+
"2026-02-02T13-00-41+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_co73hNPnAePTvVsHmdiZt2.eval": {
|
| 106 |
+
"eval_id": "H4RWdgPxrpbYDKpN8di6yo",
|
| 107 |
+
"run_id": "GezXvQeiSHrChxxq5G4f5k",
|
| 108 |
+
"task": "hf/MathArena/aime_2025@895d9df74faf7aa8dedb081a1dde6a258e594e33",
|
| 109 |
+
"task_id": "co73hNPnAePTvVsHmdiZt2",
|
| 110 |
+
"task_version": 0,
|
| 111 |
+
"version": 2,
|
| 112 |
+
"status": "cancelled",
|
| 113 |
+
"invalidated": false,
|
| 114 |
+
"model": "openai/o4-mini",
|
| 115 |
+
"started_at": "2026-02-02T13:00:41+00:00",
|
| 116 |
+
"completed_at": "2026-02-02T13:02:32+00:00"
|
| 117 |
+
},
|
| 118 |
"2026-01-30T12-35-53+00-00_hf-MathArena-aime-2025@895d9df74faf7aa8dedb081a1dde6a258e594e33_UbXsSjiS7fFKnFgCqWtycz.eval": {
|
| 119 |
"eval_id": "kum6GMmigXaMnU7EZkP8sM",
|
| 120 |
"run_id": "g84K6KqP73tPXxgCiWmt4M",
|