Spaces:
Running
Running
Upload logs/listing.json with huggingface_hub
Browse files- logs/listing.json +144 -0
logs/listing.json
ADDED
|
@@ -0,0 +1,144 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"2025-11-07T12-02-37+01-00_midicaps-eval_hDhVbXtsZzwnnJ2S5AUBNY.eval": {
|
| 3 |
+
"eval_id": "eFRJm4KVGpLH2hZtXsJK6F",
|
| 4 |
+
"run_id": "GzfPVZNZAWtm6HuyduafVK",
|
| 5 |
+
"task": "midicaps_eval",
|
| 6 |
+
"task_id": "hDhVbXtsZzwnnJ2S5AUBNY",
|
| 7 |
+
"task_version": 0,
|
| 8 |
+
"version": 2,
|
| 9 |
+
"status": "success",
|
| 10 |
+
"model": "hf-inference-providers/Qwen/Qwen3-32B:fastest",
|
| 11 |
+
"started_at": "2025-11-07T12:02:38+01:00",
|
| 12 |
+
"completed_at": "2025-11-07T12:50:15+01:00",
|
| 13 |
+
"primary_metric": {
|
| 14 |
+
"name": "accuracy",
|
| 15 |
+
"value": 0.227,
|
| 16 |
+
"params": {}
|
| 17 |
+
}
|
| 18 |
+
},
|
| 19 |
+
"2025-11-07T11-54-09+01-00_midicaps-eval_9NrHE4AKTLRhZvcLQ2Gabv.eval": {
|
| 20 |
+
"eval_id": "37ZzdHjULJ7bS8cEGV3pZH",
|
| 21 |
+
"run_id": "iNoJBzcsw9oCYy7YMaVQnK",
|
| 22 |
+
"task": "midicaps_eval",
|
| 23 |
+
"task_id": "9NrHE4AKTLRhZvcLQ2Gabv",
|
| 24 |
+
"task_version": 0,
|
| 25 |
+
"version": 2,
|
| 26 |
+
"status": "cancelled",
|
| 27 |
+
"model": "hf-inference-providers/Qwen/Qwen3-32B:fastest",
|
| 28 |
+
"started_at": "2025-11-07T11:54:09+01:00",
|
| 29 |
+
"completed_at": "2025-11-07T12:02:16+01:00"
|
| 30 |
+
},
|
| 31 |
+
"2025-11-07T11-50-36+01-00_midicaps-eval_exs5ySFazLtdTrKS8SM8yU.eval": {
|
| 32 |
+
"eval_id": "h3a9z7BD3VA7qq2jg68j6m",
|
| 33 |
+
"run_id": "edqJkT8qrHcLBBPKvnDajP",
|
| 34 |
+
"task": "midicaps_eval",
|
| 35 |
+
"task_id": "exs5ySFazLtdTrKS8SM8yU",
|
| 36 |
+
"task_version": 0,
|
| 37 |
+
"version": 2,
|
| 38 |
+
"status": "cancelled",
|
| 39 |
+
"model": "hf-inference-providers/Qwen/Qwen3-235B-A22B-Thinking-2507:fastest",
|
| 40 |
+
"started_at": "2025-11-07T11:50:36+01:00",
|
| 41 |
+
"completed_at": "2025-11-07T11:53:50+01:00"
|
| 42 |
+
},
|
| 43 |
+
"2025-11-07T11-39-00+01-00_midicaps-eval_dDZdCH42Ff6a5uk9oDQr5K.eval": {
|
| 44 |
+
"eval_id": "Seec6xaRvmTcFwGyDWbThG",
|
| 45 |
+
"run_id": "grJSKX9cs2mppsTye94inj",
|
| 46 |
+
"task": "midicaps_eval",
|
| 47 |
+
"task_id": "dDZdCH42Ff6a5uk9oDQr5K",
|
| 48 |
+
"task_version": 0,
|
| 49 |
+
"version": 2,
|
| 50 |
+
"status": "cancelled",
|
| 51 |
+
"model": "hf-inference-providers/Qwen/Qwen3-32B:fastest",
|
| 52 |
+
"started_at": "2025-11-07T11:39:00+01:00",
|
| 53 |
+
"completed_at": "2025-11-07T11:51:54+01:00"
|
| 54 |
+
},
|
| 55 |
+
"2025-11-07T11-38-04+01-00_midicaps-eval_Rhfv7o4SjhPi7ZCTtPUKLU.eval": {
|
| 56 |
+
"eval_id": "cJ5hhCUhGJiLkRGLpG9ptf",
|
| 57 |
+
"run_id": "Ze8BNnL2zmRRs6nE6gHUEm",
|
| 58 |
+
"task": "midicaps_eval",
|
| 59 |
+
"task_id": "Rhfv7o4SjhPi7ZCTtPUKLU",
|
| 60 |
+
"task_version": 0,
|
| 61 |
+
"version": 2,
|
| 62 |
+
"status": "cancelled",
|
| 63 |
+
"model": "hf-inference-providers/Qwen/Qwen3-Coder-30B-A3B-Instruct:fastest",
|
| 64 |
+
"started_at": "2025-11-07T11:38:04+01:00",
|
| 65 |
+
"completed_at": "2025-11-07T11:38:56+01:00"
|
| 66 |
+
},
|
| 67 |
+
"2025-11-07T11-35-40+01-00_midicaps-eval_7VV87LrTdV8nNoNekw65Kn.eval": {
|
| 68 |
+
"eval_id": "SjfEAhBgUt9wP3mGay99DR",
|
| 69 |
+
"run_id": "XUKH6RAPAkshtfwf499aTN",
|
| 70 |
+
"task": "midicaps_eval",
|
| 71 |
+
"task_id": "7VV87LrTdV8nNoNekw65Kn",
|
| 72 |
+
"task_version": 0,
|
| 73 |
+
"version": 2,
|
| 74 |
+
"status": "cancelled",
|
| 75 |
+
"model": "hf-inference-providers/Qwen/Qwen3-32B:fastest",
|
| 76 |
+
"started_at": "2025-11-07T11:35:40+01:00",
|
| 77 |
+
"completed_at": "2025-11-07T11:37:53+01:00"
|
| 78 |
+
},
|
| 79 |
+
"2025-11-07T11-22-29+01-00_midicaps-eval_EQ4Un4guSWakEqJEJZb6nV.eval": {
|
| 80 |
+
"eval_id": "djNFMh8zDxhfYQiLWBvHBy",
|
| 81 |
+
"run_id": "YGfXwk5Vywy2cyQXi6WzjM",
|
| 82 |
+
"task": "midicaps_eval",
|
| 83 |
+
"task_id": "EQ4Un4guSWakEqJEJZb6nV",
|
| 84 |
+
"task_version": 0,
|
| 85 |
+
"version": 2,
|
| 86 |
+
"status": "started",
|
| 87 |
+
"model": "hf-inference-providers/Qwen/Qwen3-32B:fastest",
|
| 88 |
+
"started_at": "",
|
| 89 |
+
"completed_at": ""
|
| 90 |
+
},
|
| 91 |
+
"2025-11-07T11-21-27+01-00_midicaps-eval_HLEuNJaKXpnfToGJGaykfF.eval": {
|
| 92 |
+
"eval_id": "NKiTnZPd5dQN6aZdibko9K",
|
| 93 |
+
"run_id": "SaccU3nZNy4t3VwpYNu232",
|
| 94 |
+
"task": "midicaps_eval",
|
| 95 |
+
"task_id": "HLEuNJaKXpnfToGJGaykfF",
|
| 96 |
+
"task_version": 0,
|
| 97 |
+
"version": 2,
|
| 98 |
+
"status": "cancelled",
|
| 99 |
+
"model": "hf-inference-providers/Qwen/Qwen3-32B",
|
| 100 |
+
"started_at": "2025-11-07T11:21:27+01:00",
|
| 101 |
+
"completed_at": "2025-11-07T11:22:20+01:00"
|
| 102 |
+
},
|
| 103 |
+
"2025-11-07T11-14-26+01-00_midicaps-eval_WCXLiYz4DB5D8gq5veChtq.eval": {
|
| 104 |
+
"eval_id": "XvcyPZ2QvGzbgW3z5mRuPX",
|
| 105 |
+
"run_id": "TmJBsKvpafwbxztQBVvGxE",
|
| 106 |
+
"task": "midicaps_eval",
|
| 107 |
+
"task_id": "WCXLiYz4DB5D8gq5veChtq",
|
| 108 |
+
"task_version": 0,
|
| 109 |
+
"version": 2,
|
| 110 |
+
"status": "cancelled",
|
| 111 |
+
"model": "hf-inference-providers/Qwen/Qwen3-4B-Instruct-2507",
|
| 112 |
+
"started_at": "2025-11-07T11:14:27+01:00",
|
| 113 |
+
"completed_at": "2025-11-07T11:16:55+01:00"
|
| 114 |
+
},
|
| 115 |
+
"2025-11-07T10-52-12+01-00_midicaps-eval_oFryNzzE8niNqXs9jzctrK.eval": {
|
| 116 |
+
"eval_id": "gQTsZtytgKX9s7Qs4wVATE",
|
| 117 |
+
"run_id": "nJA2gJvTXgJP4iZwwN4h6d",
|
| 118 |
+
"task": "midicaps_eval",
|
| 119 |
+
"task_id": "oFryNzzE8niNqXs9jzctrK",
|
| 120 |
+
"task_version": 0,
|
| 121 |
+
"version": 2,
|
| 122 |
+
"status": "cancelled",
|
| 123 |
+
"model": "hf-inference-providers/Qwen/Qwen3-4B-Instruct-2507",
|
| 124 |
+
"started_at": "2025-11-07T10:52:12+01:00",
|
| 125 |
+
"completed_at": "2025-11-07T10:54:23+01:00"
|
| 126 |
+
},
|
| 127 |
+
"2025-11-07T10-50-54+01-00_midicaps-eval_Cr3ecgUpLMNJBqrXFeLUG5.eval": {
|
| 128 |
+
"eval_id": "iiQxPgsyzaKyzWwNAwCqvn",
|
| 129 |
+
"run_id": "TjJbK3cMJm3yrKPUAuKkN7",
|
| 130 |
+
"task": "midicaps_eval",
|
| 131 |
+
"task_id": "Cr3ecgUpLMNJBqrXFeLUG5",
|
| 132 |
+
"task_version": 0,
|
| 133 |
+
"version": 2,
|
| 134 |
+
"status": "error",
|
| 135 |
+
"error": {
|
| 136 |
+
"message": "Error code: 404 - {'error': {'code': 'NOT_FOUND', 'message': 'Model not found, inaccessible, and/or not deployed', 'requestId': 'Root=1-690dc101-25e065e116024630252580c2-chatcmpl-c1328c2', 'param': 'model'}}",
|
| 137 |
+
"traceback": "Traceback (most recent call last):\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/_eval/task/run.py\", line 384, in task_run\n sample_results = await tg_collect(\n ^^^^^^^^^^^^^^^^^\n ...<7 lines>...\n )\n ^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/_util/_async.py\", line 76, in tg_collect\n raise ex.exceptions[0] from None\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/_util/_async.py\", line 64, in run_task\n result = await func()\n ^^^^^^^^^^^^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/_eval/task/run.py\", line 353, in run_sample\n return await task_run_sample(\n ^^^^^^^^^^^^^^^^^^^^^^\n ...<28 lines>...\n )\n ^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/_eval/task/run.py\", line 1034, in task_run_sample\n raise raise_error\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/_eval/task/run.py\", line 826, in task_run_sample\n raise inner_exception(ex)\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/_eval/task/run.py\", line 767, in run\n state = await plan(state, generate)\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/solver/_plan.py\", line 105, in __call__\n state = await solver(state, generate)\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/solver/_solver.py\", line 289, in solve\n return await generate(state, tool_calls=tool_calls, cache=cache, **kwargs)\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/_eval/task/run.py\", line 292, in generate\n return await task_generate(\n ^^^^^^^^^^^^^^^^^^^^\n ...<5 lines>...\n )\n ^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/_eval/task/generate.py\", line 27, in task_generate\n state.output = await model.generate(\n ^^^^^^^^^^^^^^^^^^^^^\n ...<5 lines>...\n )\n ^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/model/_model.py\", line 486, in generate\n output, event = await self._generate(\n ^^^^^^^^^^^^^^^^^^^^^\n ...<5 lines>...\n )\n ^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/model/_model.py\", line 796, in _generate\n model_output, event = await generate()\n ^^^^^^^^^^^^^^^^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/tenacity/asyncio/__init__.py\", line 189, in async_wrapped\n return await copy(fn, *args, **kwargs)\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/tenacity/asyncio/__init__.py\", line 111, in __call__\n do = await self.iter(retry_state=retry_state)\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/tenacity/asyncio/__init__.py\", line 153, in iter\n result = await action(retry_state)\n ^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/tenacity/_utils.py\", line 99, in inner\n return call(*args, **kwargs)\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/tenacity/__init__.py\", line 400, in <lambda>\n self._add_action_func(lambda rs: rs.outcome.result())\n ~~~~~~~~~~~~~~~~~^^\n File \"/opt/homebrew/Cellar/python@3.13/3.13.0_1/Frameworks/Python.framework/Versions/3.13/lib/python3.13/concurrent/futures/_base.py\", line 449, in result\n return self.__get_result()\n ~~~~~~~~~~~~~~~~~^^\n File \"/opt/homebrew/Cellar/python@3.13/3.13.0_1/Frameworks/Python.framework/Versions/3.13/lib/python3.13/concurrent/futures/_base.py\", line 401, in __get_result\n raise self._exception\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/tenacity/asyncio/__init__.py\", line 114, in __call__\n result = await fn(*args, **kwargs)\n ^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/model/_model.py\", line 727, in generate\n result = await self.api.generate(\n ^^^^^^^^^^^^^^^^^^^^^^^^\n ...<4 lines>...\n )\n ^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/model/_providers/openai_compatible.py\", line 214, in generate\n completion = await self._generate_completion(request, config)\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/model/_providers/openai_compatible.py\", line 248, in _generate_completion\n ChatCompletion, await self.client.chat.completions.create(**request)\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/openai/resources/chat/completions/completions.py\", line 2603, in create\n return await self._post(\n ^^^^^^^^^^^^^^^^^\n ...<48 lines>...\n )\n ^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/openai/_base_client.py\", line 1794, in post\n return await self.request(cast_to, opts, stream=stream, stream_cls=stream_cls)\n ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n File \"/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/openai/_base_client.py\", line 1594, in request\n raise self._make_status_error_from_response(err.response) from None\nopenai.NotFoundError: Error code: 404 - {'error': {'code': 'NOT_FOUND', 'message': 'Model not found, inaccessible, and/or not deployed', 'requestId': 'Root=1-690dc101-25e065e116024630252580c2-chatcmpl-c1328c2', 'param': 'model'}}\n",
|
| 138 |
+
"traceback_ansi": "\u001b[31mββ\u001b[0m\u001b[31mβββββββββββββββββββββββββββββββββββββββ\u001b[0m\u001b[31m \u001b[0m\u001b[1;31mTraceback \u001b[0m\u001b[1;2;31m(most recent call last)\u001b[0m\u001b[31m \u001b[0m\u001b[31mβββββββββββββββββββββββββββββββββββββββ\u001b[0m\u001b[31mββ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/_eval/task/\u001b[0m\u001b[1mrun.py\u001b[0m:384 in task_run \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/_util/\u001b[0m\u001b[1m_async.py\u001b[0m:76 in tg_collect \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/_util/\u001b[0m\u001b[1m_async.py\u001b[0m:64 in run_task \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/_eval/task/\u001b[0m\u001b[1mrun.py\u001b[0m:353 in \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m run_sample \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/_eval/task/\u001b[0m\u001b[1mrun.py\u001b[0m:1034 in \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m task_run_sample \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/_eval/task/\u001b[0m\u001b[1mrun.py\u001b[0m:826 in \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m task_run_sample \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/_eval/task/\u001b[0m\u001b[1mrun.py\u001b[0m:767 in run \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/solver/\u001b[0m\u001b[1m_plan.py\u001b[0m:105 in __call__ \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/solver/\u001b[0m\u001b[1m_solver.py\u001b[0m:289 in solve \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/_eval/task/\u001b[0m\u001b[1mrun.py\u001b[0m:292 in generate \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/_eval/task/\u001b[0m\u001b[1mgenerate.py\u001b[0m:27 in \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m task_generate \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/model/\u001b[0m\u001b[1m_model.py\u001b[0m:486 in generate \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/model/\u001b[0m\u001b[1m_model.py\u001b[0m:796 in _generate \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/tenacity/asyncio/\u001b[0m\u001b[1m__init__.py\u001b[0m:189 in \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m async_wrapped \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/tenacity/asyncio/\u001b[0m\u001b[1m__init__.py\u001b[0m:111 in __call__ \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/tenacity/asyncio/\u001b[0m\u001b[1m__init__.py\u001b[0m:153 in iter \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/tenacity/\u001b[0m\u001b[1m_utils.py\u001b[0m:99 in inner \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/tenacity/\u001b[0m\u001b[1m__init__.py\u001b[0m:400 in <lambda> \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/opt/homebrew/Cellar/python@3.13/3.13.0_1/Frameworks/Python.framework/Versions/3.13/lib/python3.13/concurrent/fut\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2mures/\u001b[0m\u001b[1m_base.py\u001b[0m:449 in result \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m446 \u001b[0m\u001b[2mβ β β β \u001b[0m\u001b[94mif\u001b[0m \u001b[96mself\u001b[0m._state \u001b[95min\u001b[0m [CANCELLED, CANCELLED_AND_NOTIFIED]: \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m447 \u001b[0m\u001b[2mβ β β β β \u001b[0m\u001b[94mraise\u001b[0m CancelledError() \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m448 \u001b[0m\u001b[2mβ β β β \u001b[0m\u001b[94melif\u001b[0m \u001b[96mself\u001b[0m._state == FINISHED: \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31m> \u001b[0m449 \u001b[2mβ β β β β \u001b[0m\u001b[94mreturn\u001b[0m \u001b[96mself\u001b[0m.__get_result() \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m450 \u001b[0m\u001b[2mβ β β β \u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m451 \u001b[0m\u001b[2mβ β β β \u001b[0m\u001b[96mself\u001b[0m._condition.wait(timeout) \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m452 \u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/opt/homebrew/Cellar/python@3.13/3.13.0_1/Frameworks/Python.framework/Versions/3.13/lib/python3.13/concurrent/fut\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2mures/\u001b[0m\u001b[1m_base.py\u001b[0m:401 in __get_result \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m398 \u001b[0m\u001b[2mβ \u001b[0m\u001b[94mdef\u001b[0m\u001b[90m \u001b[0m\u001b[92m__get_result\u001b[0m(\u001b[96mself\u001b[0m): \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m399 \u001b[0m\u001b[2mβ β \u001b[0m\u001b[94mif\u001b[0m \u001b[96mself\u001b[0m._exception: \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m400 \u001b[0m\u001b[2mβ β β \u001b[0m\u001b[94mtry\u001b[0m: \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31m> \u001b[0m401 \u001b[2mβ β β β \u001b[0m\u001b[94mraise\u001b[0m \u001b[96mself\u001b[0m._exception \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m402 \u001b[0m\u001b[2mβ β β \u001b[0m\u001b[94mfinally\u001b[0m: \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m403 \u001b[0m\u001b[2mβ β β β \u001b[0m\u001b[2m# Break a reference cycle with the exception in self._exception\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m404 \u001b[0m\u001b[2mβ β β β \u001b[0m\u001b[1;4;96mself\u001b[0m = \u001b[94mNone\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/tenacity/asyncio/\u001b[0m\u001b[1m__init__.py\u001b[0m:114 in __call__ \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/model/\u001b[0m\u001b[1m_model.py\u001b[0m:727 in generate \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/model/_providers/\u001b[0m\u001b[1mopenai_compatible\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[1m.py\u001b[0m:214 in generate \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/inspect_ai/model/_providers/\u001b[0m\u001b[1mopenai_compatible\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[1m.py\u001b[0m:248 in _generate_completion \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/openai/resources/chat/completions/\u001b[0m\u001b[1mcompletions\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[1m.py\u001b[0m:2603 in create \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m2600 \u001b[0m\u001b[2mβ β \u001b[0mtimeout: \u001b[96mfloat\u001b[0m | httpx.Timeout | \u001b[94mNone\u001b[0m | NotGiven = not_given, \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m2601 \u001b[0m\u001b[2mβ \u001b[0m) -> ChatCompletion | AsyncStream[ChatCompletionChunk]: \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m2602 \u001b[0m\u001b[2mβ β \u001b[0mvalidate_response_format(response_format) \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31m> \u001b[0m2603 \u001b[2mβ β \u001b[0m\u001b[94mreturn\u001b[0m \u001b[1;4;94mawait\u001b[0m\u001b[1;4m \u001b[0m\u001b[1;4;96mself\u001b[0m\u001b[1;4m._post(\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m2604 \u001b[0m\u001b[2mβ β β \u001b[0m\u001b[1;4;33m\"\u001b[0m\u001b[1;4;33m/chat/completions\u001b[0m\u001b[1;4;33m\"\u001b[0m\u001b[1;4m,\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m2605 \u001b[0m\u001b[2mβ β β \u001b[0m\u001b[1;4mbody=\u001b[0m\u001b[1;4;94mawait\u001b[0m\u001b[1;4m async_maybe_transform(\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m2606 \u001b[0m\u001b[2mβ β β β \u001b[0m\u001b[1;4m{\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/openai/\u001b[0m\u001b[1m_base_client.py\u001b[0m:1794 in post \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m1791 \u001b[0m\u001b[2mβ β \u001b[0mopts = FinalRequestOptions.construct( \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m1792 \u001b[0m\u001b[2mβ β β \u001b[0mmethod=\u001b[33m\"\u001b[0m\u001b[33mpost\u001b[0m\u001b[33m\"\u001b[0m, url=path, json_data=body, files=\u001b[94mawait\u001b[0m async_to_httpx_files(fi \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m1793 \u001b[0m\u001b[2mβ β \u001b[0m) \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31m> \u001b[0m1794 \u001b[2mβ β \u001b[0m\u001b[94mreturn\u001b[0m \u001b[1;4;94mawait\u001b[0m\u001b[1;4m \u001b[0m\u001b[1;4;96mself\u001b[0m\u001b[1;4m.request(cast_to, opts, stream=stream, stream_cls=stream_cls)\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m1795 \u001b[0m\u001b[2mβ \u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m1796 \u001b[0m\u001b[2mβ \u001b[0m\u001b[94masync\u001b[0m \u001b[94mdef\u001b[0m\u001b[90m \u001b[0m\u001b[92mpatch\u001b[0m( \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m1797 \u001b[0m\u001b[2mβ β \u001b[0m\u001b[96mself\u001b[0m, \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m/Users/danielvilasuero/2025/mufi/.venv/lib/python3.13/site-packages/openai/\u001b[0m\u001b[1m_base_client.py\u001b[0m:1594 in request \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m1591 \u001b[0m\u001b[2mβ β β β β \u001b[0m\u001b[94mawait\u001b[0m err.response.aread() \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m1592 \u001b[0m\u001b[2mβ β β β \u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m1593 \u001b[0m\u001b[2mβ β β β \u001b[0mlog.debug(\u001b[33m\"\u001b[0m\u001b[33mRe-raising status error\u001b[0m\u001b[33m\"\u001b[0m) \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[31m> \u001b[0m1594 \u001b[2mβ β β β \u001b[0m\u001b[1;4;94mraise\u001b[0m\u001b[1;4m \u001b[0m\u001b[1;4;96mself\u001b[0m\u001b[1;4m._make_status_error_from_response(err.response) \u001b[0m\u001b[1;4;94mfrom\u001b[0m\u001b[1;4;90m \u001b[0m\u001b[1;4;94mNone\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m1595 \u001b[0m\u001b[2mβ β β \u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m1596 \u001b[0m\u001b[2mβ β β \u001b[0m\u001b[94mbreak\u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβ\u001b[0m \u001b[2m1597 \u001b[0m \u001b[31mβ\u001b[0m\n\u001b[31mβββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββββ\u001b[0m\n\u001b[1;91mNotFoundError: \u001b[0mError code: \u001b[1;36m404\u001b[0m - \u001b[1m{\u001b[0m\u001b[32m'error'\u001b[0m: \u001b[1m{\u001b[0m\u001b[32m'code'\u001b[0m: \u001b[32m'NOT_FOUND'\u001b[0m, \u001b[32m'message'\u001b[0m: \u001b[32m'Model not found, inaccessible, and/or \u001b[0m\n\u001b[32mnot deployed'\u001b[0m, \u001b[32m'requestId'\u001b[0m: \u001b[32m'\u001b[0m\u001b[32mRoot\u001b[0m\u001b[32m=\u001b[0m\u001b[32m1\u001b[0m\u001b[32m-690dc101-25e065e116024630252580c2-chatcmpl-c1328c2'\u001b[0m, \u001b[32m'param'\u001b[0m: \u001b[32m'model'\u001b[0m\u001b[1m}\u001b[0m\u001b[1m}\u001b[0m\n"
|
| 139 |
+
},
|
| 140 |
+
"model": "hf-inference-providers/Qwen/Qwen3-1.7B",
|
| 141 |
+
"started_at": "2025-11-07T10:50:54+01:00",
|
| 142 |
+
"completed_at": "2025-11-07T10:51:00+01:00"
|
| 143 |
+
}
|
| 144 |
+
}
|