Michael Rabinovich committed on
Commit ·
bd9b6ba
1
Parent(s): 0a04e61
submit: keep eval-gpu image repo as a fixed literal
Browse files
revert the env-var indirection; the audit sweep stays prose-only and
must not alter dispatch resolution. the repo id and job namespace are
real deployed identities, kept as documented constants.
submit.py
CHANGED
|
@@ -20,8 +20,8 @@ poll of an HF Jobs GPU eval + boot-time stuck-pending sweep. The
|
|
| 20 |
handler validates the upload, uploads the zip to
|
| 21 |
``submissions/<id>.zip``, appends a ``status: pending`` row to
|
| 22 |
``results.jsonl`` (under a process-wide lock), spawns a daemon thread
|
| 23 |
-
that dispatches a per-submission HF Job against the
|
| 24 |
-
|
| 25 |
``inspect_job`` until the job's stage is terminal. On COMPLETED the
|
| 26 |
worker downloads ``reports/<id>.json`` (the Job already uploaded
|
| 27 |
``reports/<id>.{html,json}`` to the submissions dataset), reads
|
|
@@ -111,7 +111,7 @@ from huggingface_hub import (
|
|
| 111 |
)
|
| 112 |
from huggingface_hub.errors import EntryNotFoundError
|
| 113 |
|
| 114 |
-
from leaderboard import HF_DATA_REPO,
|
| 115 |
|
| 116 |
logger = logging.getLogger(__name__)
|
| 117 |
|
|
@@ -136,16 +136,11 @@ STUCK_PENDING_REASON = "evaluation interrupted by Space restart"
|
|
| 136 |
BOOT_SWEEP_ENV = "CADGENBENCH_DISABLE_BOOT_SWEEP"
|
| 137 |
|
| 138 |
# HF Jobs target. The eval-gpu image is hosted as a Docker Space
|
| 139 |
-
# (paused; image-only)
|
| 140 |
-
#
|
| 141 |
-
#
|
| 142 |
-
#
|
| 143 |
-
|
| 144 |
-
# so it is deliberately not configurable. a10g-large fits
|
| 145 |
-
# cadgenbench evaluate --workers 8 comfortably in 46 GB RAM.
|
| 146 |
-
EVAL_GPU_SPACE = os.getenv(
|
| 147 |
-
"CADGENBENCH_EVAL_GPU_SPACE", f"{HF_ORG}/cadgenbench-eval-gpu"
|
| 148 |
-
)
|
| 149 |
EVAL_JOB_FLAVOR = "a10g-large"
|
| 150 |
EVAL_JOB_NAMESPACE = "michaelr27"
|
| 151 |
EVAL_JOB_TIMEOUT = "30m"
|
|
|
|
| 20 |
handler validates the upload, uploads the zip to
|
| 21 |
``submissions/<id>.zip``, appends a ``status: pending`` row to
|
| 22 |
``results.jsonl`` (under a process-wide lock), spawns a daemon thread
|
| 23 |
+
that dispatches a per-submission HF Job against the
|
| 24 |
+
``HuggingAI4Engineering/cadgenbench-eval-gpu`` image and polls
|
| 25 |
``inspect_job`` until the job's stage is terminal. On COMPLETED the
|
| 26 |
worker downloads ``reports/<id>.json`` (the Job already uploaded
|
| 27 |
``reports/<id>.{html,json}`` to the submissions dataset), reads
|
|
|
|
| 111 |
)
|
| 112 |
from huggingface_hub.errors import EntryNotFoundError
|
| 113 |
|
| 114 |
+
from leaderboard import HF_DATA_REPO, HF_SUBMISSIONS_REPO
|
| 115 |
|
| 116 |
logger = logging.getLogger(__name__)
|
| 117 |
|
|
|
|
| 136 |
BOOT_SWEEP_ENV = "CADGENBENCH_DISABLE_BOOT_SWEEP"
|
| 137 |
|
| 138 |
# HF Jobs target. The eval-gpu image is hosted as a Docker Space
|
| 139 |
+
# (paused; image-only) at HuggingAI4Engineering/cadgenbench-eval-gpu.
|
| 140 |
+
# Jobs run under the personal `michaelr27` namespace (no-bill for
|
| 141 |
+
# HF employees per Round 6 of space-setup/leandro.md). a10g-large
|
| 142 |
+
# fits cadgenbench evaluate --workers 8 comfortably in 46 GB RAM.
|
| 143 |
+
EVAL_GPU_SPACE = "HuggingAI4Engineering/cadgenbench-eval-gpu"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 144 |
EVAL_JOB_FLAVOR = "a10g-large"
|
| 145 |
EVAL_JOB_NAMESPACE = "michaelr27"
|
| 146 |
EVAL_JOB_TIMEOUT = "30m"
|