Spaces:

Hrant
/

leaderboarder-builder

Sleeping

Hrant committed on Mar 1

Commit

a4b35cf

verified ·

1 Parent(s): 54e943f

Update leaderboard via Leaderboarder

Files changed (4) hide show

app.py CHANGED Viewed

@@ -55,12 +55,15 @@ def run_build_and_deploy(
     run_id = datetime.now(timezone.utc).strftime("%Y%m%d-%H%M%S")
     base_slug = slugify(benchmark_input)
     output_dir = WORKDIR / f"{base_slug}-{run_id}"
-    summary = pipeline.run(
-        input_value=benchmark_input,
-        output_dir=str(output_dir),
-        max_citations=int(max_citations),
-        read_citations=int(read_citations),
-    )
     owner = resolve_owner(settings.hf_token)
     if not owner:
@@ -72,12 +75,15 @@ def run_build_and_deploy(
         target_space = f"{owner}/leaderboarder-{slugify(summary.benchmark_name)}"
     generate_space_artifacts(Path(summary.output_dir), summary.benchmark_name)
-    deployed_url = deploy_to_hf_space(
-        output_dir=Path(summary.output_dir),
-        space_id=target_space,
-        hf_token=settings.hf_token,
-        private=bool(private_space),
-    )
     csv_path = Path(summary.output_dir) / "leaderboard.csv"
     preview = pd.read_csv(csv_path).head(25) if csv_path.exists() else pd.DataFrame()

     run_id = datetime.now(timezone.utc).strftime("%Y%m%d-%H%M%S")
     base_slug = slugify(benchmark_input)
     output_dir = WORKDIR / f"{base_slug}-{run_id}"
+    try:
+        summary = pipeline.run(
+            input_value=benchmark_input,
+            output_dir=str(output_dir),
+            max_citations=int(max_citations),
+            read_citations=int(read_citations),
+        )
+    except Exception as exc:
+        return f"Build failed: {exc}", "", pd.DataFrame()
     owner = resolve_owner(settings.hf_token)
     if not owner:
         target_space = f"{owner}/leaderboarder-{slugify(summary.benchmark_name)}"
     generate_space_artifacts(Path(summary.output_dir), summary.benchmark_name)
+    try:
+        deployed_url = deploy_to_hf_space(
+            output_dir=Path(summary.output_dir),
+            space_id=target_space,
+            hf_token=settings.hf_token,
+            private=bool(private_space),
+        )
+    except Exception as exc:
+        return f"Deployment failed: {exc}", json.dumps(summary.to_dict(), indent=2, ensure_ascii=False), pd.DataFrame()
     csv_path = Path(summary.output_dir) / "leaderboard.csv"
     preview = pd.read_csv(csv_path).head(25) if csv_path.exists() else pd.DataFrame()

leaderboarder/deploy.py CHANGED Viewed

@@ -78,6 +78,7 @@ demo.launch()
 SPACE_REQUIREMENTS = """gradio>=4.44.0
 pandas>=2.2.2
 """
 BUILDER_SPACE_REQUIREMENTS = """gradio>=4.44.0
@@ -89,6 +90,7 @@ pyarrow>=16.1.0
 pypdf>=4.3.1
 python-dotenv>=1.0.1
 requests>=2.32.3
 trafilatura>=1.12.2
 """
@@ -149,12 +151,15 @@ def run_build_and_deploy(
     run_id = datetime.now(timezone.utc).strftime("%Y%m%d-%H%M%S")
     base_slug = slugify(benchmark_input)
     output_dir = WORKDIR / f"{base_slug}-{run_id}"
-    summary = pipeline.run(
-        input_value=benchmark_input,
-        output_dir=str(output_dir),
-        max_citations=int(max_citations),
-        read_citations=int(read_citations),
-    )
     owner = resolve_owner(settings.hf_token)
     if not owner:
@@ -166,12 +171,15 @@ def run_build_and_deploy(
         target_space = f"{owner}/leaderboarder-{slugify(summary.benchmark_name)}"
     generate_space_artifacts(Path(summary.output_dir), summary.benchmark_name)
-    deployed_url = deploy_to_hf_space(
-        output_dir=Path(summary.output_dir),
-        space_id=target_space,
-        hf_token=settings.hf_token,
-        private=bool(private_space),
-    )
     csv_path = Path(summary.output_dir) / "leaderboard.csv"
     preview = pd.read_csv(csv_path).head(25) if csv_path.exists() else pd.DataFrame()

 SPACE_REQUIREMENTS = """gradio>=4.44.0
 pandas>=2.2.2
+tabulate>=0.9.0
 """
 BUILDER_SPACE_REQUIREMENTS = """gradio>=4.44.0
 pypdf>=4.3.1
 python-dotenv>=1.0.1
 requests>=2.32.3
+tabulate>=0.9.0
 trafilatura>=1.12.2
 """
     run_id = datetime.now(timezone.utc).strftime("%Y%m%d-%H%M%S")
     base_slug = slugify(benchmark_input)
     output_dir = WORKDIR / f"{base_slug}-{run_id}"
+    try:
+        summary = pipeline.run(
+            input_value=benchmark_input,
+            output_dir=str(output_dir),
+            max_citations=int(max_citations),
+            read_citations=int(read_citations),
+        )
+    except Exception as exc:
+        return f"Build failed: {exc}", "", pd.DataFrame()
     owner = resolve_owner(settings.hf_token)
     if not owner:
         target_space = f"{owner}/leaderboarder-{slugify(summary.benchmark_name)}"
     generate_space_artifacts(Path(summary.output_dir), summary.benchmark_name)
+    try:
+        deployed_url = deploy_to_hf_space(
+            output_dir=Path(summary.output_dir),
+            space_id=target_space,
+            hf_token=settings.hf_token,
+            private=bool(private_space),
+        )
+    except Exception as exc:
+        return f"Deployment failed: {exc}", json.dumps(summary.to_dict(), indent=2, ensure_ascii=False), pd.DataFrame()
     csv_path = Path(summary.output_dir) / "leaderboard.csv"
     preview = pd.read_csv(csv_path).head(25) if csv_path.exists() else pd.DataFrame()

leaderboarder/storage.py CHANGED Viewed

@@ -97,7 +97,7 @@ def save_leaderboard(
     public_frame.to_csv(csv_path, index=False)
     public_frame.to_json(json_path, orient="records", indent=2, force_ascii=False)
     public_frame.to_parquet(parquet_path, index=False)
-    md_path.write_text(public_frame.to_markdown(index=False), encoding="utf-8")
     frame.to_json(raw_json_path, orient="records", indent=2, force_ascii=False)
     return {
@@ -220,3 +220,11 @@ def _unique_preserve_order(values: list[str]) -> list[str]:
         seen.add(item)
         out.append(item)
     return out

     public_frame.to_csv(csv_path, index=False)
     public_frame.to_json(json_path, orient="records", indent=2, force_ascii=False)
     public_frame.to_parquet(parquet_path, index=False)
+    md_path.write_text(_to_markdown_safe(public_frame), encoding="utf-8")
     frame.to_json(raw_json_path, orient="records", indent=2, force_ascii=False)
     return {
         seen.add(item)
         out.append(item)
     return out
+def _to_markdown_safe(frame: pd.DataFrame) -> str:
+    """Render ``frame`` as Markdown text, falling back to CSV text on failure.
+
+    First tries ``frame.to_markdown(index=False)``. If that call raises any
+    ``Exception``, the result of ``frame.to_csv(index=False)`` is returned
+    instead, so the caller still gets text to write to the ``.md`` file.
+    """
+    try:
+        return frame.to_markdown(index=False)
+    except Exception:
+        # Fallback when optional dependency `tabulate` is unavailable.
+        # NOTE(review): this catches every Exception, not only a missing
+        # `tabulate`; other rendering errors would also silently yield CSV
+        # content -- confirm that is intended.
+        return frame.to_csv(index=False)

requirements.txt CHANGED Viewed

@@ -7,4 +7,5 @@ pyarrow>=16.1.0
 pypdf>=4.3.1
 python-dotenv>=1.0.1
 requests>=2.32.3
 trafilatura>=1.12.2

 pypdf>=4.3.1
 python-dotenv>=1.0.1
 requests>=2.32.3
+tabulate>=0.9.0
 trafilatura>=1.12.2