Spaces:

lanczos
/

graphtestbed

Running

App Files Files Community

Zhu Jiajun (jz28583) Claude Opus 4.7 (1M context) committed on Apr 21

Commit

1a157a1

1 Parent(s): 9cb903d

Fix kaggle async: use sentinel -1.0 for pending (NOT NULL) + correct col names

Browse files

Files changed (1) hide show

server/api.py +19 -12

server/api.py CHANGED Viewed

@@ -51,6 +51,11 @@ MANIFEST_PATH = Path(os.environ.get(
 ))
 QUOTA_PER_DAY = int(os.environ.get("GT_QUOTA", "5"))
 BYPASS_KEY = os.environ.get("GT_BYPASS_KEY", "").strip() or None
 MAX_UPLOAD_BYTES = 50 * 1024 * 1024  # 50 MB hard cap
@@ -199,13 +204,13 @@ def _kaggle_poll_loop(competition: str, description: str, run_id: str,
                 final = (float("nan"), {"error": f"kaggle scoring failed: {err}"})
             break  # found our row; if still pending the inner loop falls through
     if final is None:
-        final = (float("nan"), {"error": f"polled {timeout_s}s without complete"})
     primary, secondary = final
-    # NaN can't go through SQLite NUMERIC; persist as NULL when scoring failed.
-    primary_db = None if primary != primary else primary  # NaN check
     conn = _db()
     conn.execute(
-        "UPDATE submissions SET primary_metric = ?, secondary = ? "
         "WHERE run_id = ?",
         (primary_db, _json.dumps(secondary), run_id),
     )
@@ -312,7 +317,8 @@ def submit():
             # the client never has to hold open a long-running connection
             # (HF Space's reverse proxy kills these around the 5-min mark).
             description = _kaggle_submit(comp, raw, run_id)
-            scored = {"primary": None, "secondary": {"status": "pending"},
                       "n_rows": -1}
             pending = True
         else:
@@ -389,7 +395,7 @@ def leaderboard(task: str):
         SELECT agent, MAX(primary_metric) as best, COUNT(*) as n_subs,
                MIN(submitted_at) as first_seen
         FROM submissions
-        WHERE task = ? AND primary_metric IS NOT NULL
         GROUP BY agent
         ORDER BY best DESC
     """, (task,)).fetchall()
@@ -411,7 +417,7 @@ def leaderboard_all():
     rows = conn.execute("""
         SELECT task, agent, MAX(primary_metric) as best
         FROM submissions
-        WHERE primary_metric IS NOT NULL
         GROUP BY task, agent
     """).fetchall()
     conn.close()
@@ -474,8 +480,8 @@ def run_status(run_id: str):
     """
     conn = _db()
     row = conn.execute("""
-        SELECT run_id, task, agent, primary_metric, secondary, sha256,
-               n_rows, ts
         FROM submissions WHERE run_id = ?
     """, (run_id,)).fetchone()
     conn.close()
@@ -483,11 +489,12 @@ def run_status(run_id: str):
         return jsonify({"error": f"no run '{run_id}'"}), 404
     rid, task, agent, primary, secondary, sha, n_rows, ts = row
     sec = json.loads(secondary) if secondary else {}
-    if primary is None:
-        # Kaggle backend, still polling
         status = "pending"
     elif sec.get("error"):
         status = "failed"
     else:
         status = "complete"
     return jsonify({
@@ -1267,7 +1274,7 @@ def landing():
             SELECT agent, MAX(primary_metric) AS p, COUNT(*) AS n,
                    MIN(submitted_at) AS f
             FROM submissions
-            WHERE task = ? AND primary_metric IS NOT NULL
             GROUP BY agent ORDER BY p DESC
         """, (name,)).fetchall()
         n_rows_cfg = s.get("n_rows")

 ))
 QUOTA_PER_DAY = int(os.environ.get("GT_QUOTA", "5"))
 BYPASS_KEY = os.environ.get("GT_BYPASS_KEY", "").strip() or None
+# Sentinel for kaggle-backend rows that have no usable score: either the
+# score is still being polled, or scoring failed / timed out. The
+# submissions table has primary_metric NOT NULL so we can't store NULL —
+# leaderboard queries filter `primary_metric > -1` to exclude these rows.
+_PENDING_SENTINEL = -1.0
 MAX_UPLOAD_BYTES = 50 * 1024 * 1024  # 50 MB hard cap
                 final = (float("nan"), {"error": f"kaggle scoring failed: {err}"})
             break  # found our row; if still pending the inner loop falls through
     if final is None:
+        final = (-1.0, {"error": f"polled {timeout_s}s without complete"})
     primary, secondary = final
+    # On failure leave the sentinel so it stays out of the leaderboard.
+    primary_db = -1.0 if primary != primary else primary  # NaN check
     conn = _db()
     conn.execute(
+        "UPDATE submissions SET primary_metric = ?, secondary_json = ? "
         "WHERE run_id = ?",
         (primary_db, _json.dumps(secondary), run_id),
     )
             # the client never has to hold open a long-running connection
             # (HF Space's reverse proxy kills these around the 5-min mark).
             description = _kaggle_submit(comp, raw, run_id)
+            scored = {"primary": _PENDING_SENTINEL,
+                      "secondary": {"status": "pending"},
                       "n_rows": -1}
             pending = True
         else:
         SELECT agent, MAX(primary_metric) as best, COUNT(*) as n_subs,
                MIN(submitted_at) as first_seen
         FROM submissions
+        WHERE task = ? AND primary_metric > -1
         GROUP BY agent
         ORDER BY best DESC
     """, (task,)).fetchall()
     rows = conn.execute("""
         SELECT task, agent, MAX(primary_metric) as best
         FROM submissions
+        WHERE primary_metric > -1
         GROUP BY task, agent
     """).fetchall()
     conn.close()
     """
     conn = _db()
     row = conn.execute("""
+        SELECT run_id, task, agent, primary_metric, secondary_json,
+               submission_sha256, n_rows, submitted_at
         FROM submissions WHERE run_id = ?
     """, (run_id,)).fetchone()
     conn.close()
         return jsonify({"error": f"no run '{run_id}'"}), 404
     rid, task, agent, primary, secondary, sha, n_rows, ts = row
     sec = json.loads(secondary) if secondary else {}
+    if primary == _PENDING_SENTINEL:
         status = "pending"
+        primary = None
     elif sec.get("error"):
         status = "failed"
+        primary = None
     else:
         status = "complete"
     return jsonify({
             SELECT agent, MAX(primary_metric) AS p, COUNT(*) AS n,
                    MIN(submitted_at) AS f
             FROM submissions
+            WHERE task = ? AND primary_metric > -1
             GROUP BY agent ORDER BY p DESC
         """, (name,)).fetchall()
         n_rows_cfg = s.get("n_rows")