Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
Handle hf_token for local runs
Browse files- yourbench_space/app.py +17 -14
yourbench_space/app.py
CHANGED
|
@@ -146,16 +146,19 @@ def run_evaluation_pipeline(oauth_token: gr.OAuthToken | None, org_name, eval_na
|
|
| 146 |
repo_id = f"{org_name}/leaderboard_yourbench_{eval_ds_name.replace('/', '_')}"
|
| 147 |
folder_path = str(Path(PATH) / "yourbench_space" / "leaderboard_space")
|
| 148 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 149 |
try:
|
| 150 |
-
load_dataset(eval_ds_name, name=config_name, streaming=True, token=
|
| 151 |
except Exception as e:
|
| 152 |
logger.error(f"Failed to load dataset '{eval_ds_name}': {e}")
|
| 153 |
return "❌ Failed: Dataset loading error"
|
| 154 |
|
| 155 |
-
new_env = os.environ.copy()
|
| 156 |
-
if oauth_token:
|
| 157 |
-
new_env["HF_TOKEN"] = oauth_token.token
|
| 158 |
-
|
| 159 |
try:
|
| 160 |
create_eval_file(eval_ds_name)
|
| 161 |
status = asyncio.run(run_evaluations(org=org_name, eval_ds_name=eval_ds_name, custom_env=new_env))
|
|
@@ -171,18 +174,18 @@ def run_evaluation_pipeline(oauth_token: gr.OAuthToken | None, org_name, eval_na
|
|
| 171 |
repo_id=repo_id,
|
| 172 |
repo_type="space",
|
| 173 |
space_sdk="gradio",
|
| 174 |
-
token=
|
| 175 |
)
|
| 176 |
except Exception as e:
|
| 177 |
if "409" in str(e) and "already created this space repo" in str(e):
|
| 178 |
logger.info(f"Space '{repo_id}' already exists. Deleting and regenerating it.")
|
| 179 |
try:
|
| 180 |
-
api.delete_repo(repo_id=repo_id, repo_type="space", token=
|
| 181 |
api.create_repo(
|
| 182 |
repo_id=repo_id,
|
| 183 |
repo_type="space",
|
| 184 |
space_sdk="gradio",
|
| 185 |
-
token=
|
| 186 |
)
|
| 187 |
space_was_regenerated = True
|
| 188 |
except Exception as delete_err:
|
|
@@ -197,16 +200,16 @@ def run_evaluation_pipeline(oauth_token: gr.OAuthToken | None, org_name, eval_na
|
|
| 197 |
repo_id=repo_id,
|
| 198 |
repo_type="space",
|
| 199 |
folder_path=folder_path,
|
| 200 |
-
token=
|
| 201 |
)
|
| 202 |
api.add_space_secret(
|
| 203 |
repo_id=repo_id,
|
| 204 |
key="HF_TOKEN",
|
| 205 |
-
value=
|
| 206 |
-
token=
|
| 207 |
)
|
| 208 |
-
api.add_space_variable(repo_id=repo_id, key="TASK", value=eval_ds_name, token=
|
| 209 |
-
api.add_space_variable(repo_id=repo_id, key="ORG_NAME", value=org_name, token=
|
| 210 |
except Exception as e:
|
| 211 |
logger.error(f"Failed during space setup: {e}")
|
| 212 |
return f"✅ Evaluation succeeded\n❌ Failed: Space setup error\n{e}"
|
|
@@ -247,7 +250,7 @@ def init_session(profile: gr.OAuthProfile | None):
|
|
| 247 |
btn_launch_evals = gr.Button(
|
| 248 |
"🚀 Launch Evaluation",
|
| 249 |
visible=True,
|
| 250 |
-
interactive=
|
| 251 |
variant="primary",
|
| 252 |
)
|
| 253 |
|
|
|
|
| 146 |
repo_id = f"{org_name}/leaderboard_yourbench_{eval_ds_name.replace('/', '_')}"
|
| 147 |
folder_path = str(Path(PATH) / "yourbench_space" / "leaderboard_space")
|
| 148 |
|
| 149 |
+
new_env = os.environ.copy()
|
| 150 |
+
if oauth_token:
|
| 151 |
+
hf_token = oauth_token.token
|
| 152 |
+
new_env["HF_TOKEN"] = hf_token
|
| 153 |
+
else:
|
| 154 |
+
hf_token = os.environ.get("HF_TOKEN")
|
| 155 |
+
|
| 156 |
try:
|
| 157 |
+
load_dataset(eval_ds_name, name=config_name, streaming=True, token=hf_token)
|
| 158 |
except Exception as e:
|
| 159 |
logger.error(f"Failed to load dataset '{eval_ds_name}': {e}")
|
| 160 |
return "❌ Failed: Dataset loading error"
|
| 161 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 162 |
try:
|
| 163 |
create_eval_file(eval_ds_name)
|
| 164 |
status = asyncio.run(run_evaluations(org=org_name, eval_ds_name=eval_ds_name, custom_env=new_env))
|
|
|
|
| 174 |
repo_id=repo_id,
|
| 175 |
repo_type="space",
|
| 176 |
space_sdk="gradio",
|
| 177 |
+
token=hf_token,
|
| 178 |
)
|
| 179 |
except Exception as e:
|
| 180 |
if "409" in str(e) and "already created this space repo" in str(e):
|
| 181 |
logger.info(f"Space '{repo_id}' already exists. Deleting and regenerating it.")
|
| 182 |
try:
|
| 183 |
+
api.delete_repo(repo_id=repo_id, repo_type="space", token=hf_token)
|
| 184 |
api.create_repo(
|
| 185 |
repo_id=repo_id,
|
| 186 |
repo_type="space",
|
| 187 |
space_sdk="gradio",
|
| 188 |
+
token=hf_token,
|
| 189 |
)
|
| 190 |
space_was_regenerated = True
|
| 191 |
except Exception as delete_err:
|
|
|
|
| 200 |
repo_id=repo_id,
|
| 201 |
repo_type="space",
|
| 202 |
folder_path=folder_path,
|
| 203 |
+
token=hf_token,
|
| 204 |
)
|
| 205 |
api.add_space_secret(
|
| 206 |
repo_id=repo_id,
|
| 207 |
key="HF_TOKEN",
|
| 208 |
+
value=hf_token,
|
| 209 |
+
token=hf_token,
|
| 210 |
)
|
| 211 |
+
api.add_space_variable(repo_id=repo_id, key="TASK", value=eval_ds_name, token=hf_token)
|
| 212 |
+
api.add_space_variable(repo_id=repo_id, key="ORG_NAME", value=org_name, token=hf_token)
|
| 213 |
except Exception as e:
|
| 214 |
logger.error(f"Failed during space setup: {e}")
|
| 215 |
return f"✅ Evaluation succeeded\n❌ Failed: Space setup error\n{e}"
|
|
|
|
| 250 |
btn_launch_evals = gr.Button(
|
| 251 |
"🚀 Launch Evaluation",
|
| 252 |
visible=True,
|
| 253 |
+
interactive=True, # Start non-interactive
|
| 254 |
variant="primary",
|
| 255 |
)
|
| 256 |
|