Spaces:
Sleeping
Sleeping
KAPO hf runtime finalizer
Browse files
- .env +6 -6
- bootstrap_space_runtime.py +6 -6
- brain_server/api/main.py +4 -1
- kapo.env +6 -6
.env
CHANGED
|
@@ -8,21 +8,21 @@ BRAIN_ROLES=debugger,fallback
|
|
| 8 |
BRAIN_TEMPLATE=hf-space-cpu
|
| 9 |
BRAIN_TUNNEL_PROVIDER=none
|
| 10 |
FIREBASE_ENABLED=0
|
| 11 |
-
GOOGLE_DRIVE_BOOTSTRAP_URL=https://drive.google.com/uc?export=download&id=
|
| 12 |
HF_ACCELERATOR=cpu
|
| 13 |
HF_SPACE_DOCKER=1
|
| 14 |
KAGGLE_AUTO_BOOTSTRAP=0
|
| 15 |
-
KAPO_BOOTSTRAP_URL=https://drive.google.com/uc?export=download&id=
|
| 16 |
KAPO_COMPUTE_PROFILE=cpu
|
| 17 |
KAPO_DISABLE_EMBEDDINGS=1
|
| 18 |
KAPO_HF_INFERENCE_API=0
|
| 19 |
KAPO_HF_TRANSFORMERS_RUNTIME=1
|
| 20 |
KAPO_LAZY_EMBED_STARTUP=1
|
| 21 |
KAPO_LAZY_MODEL_STARTUP=1
|
| 22 |
-
KAPO_PATCH_BUNDLE_URL=https://drive.google.com/uc?export=download&id=
|
| 23 |
-
KAPO_PATCH_MANIFEST_URL=https://drive.google.com/uc?export=download&id=
|
| 24 |
-
KAPO_REMOTE_ENV_PASSWORD_B64=
|
| 25 |
-
KAPO_REMOTE_ENV_URL_B64=
|
| 26 |
KAPO_SHARED_STATE_BACKEND=google_drive
|
| 27 |
MODEL_PROFILE_ID=hf-debugger-qwen25-7b-instruct
|
| 28 |
MODEL_REPO=Qwen/Qwen2.5-1.5B-Instruct
|
|
|
|
| 8 |
BRAIN_TEMPLATE=hf-space-cpu
|
| 9 |
BRAIN_TUNNEL_PROVIDER=none
|
| 10 |
FIREBASE_ENABLED=0
|
| 11 |
+
GOOGLE_DRIVE_BOOTSTRAP_URL=https://drive.google.com/uc?export=download&id=1cTITRABqhuRUyCaHFRA8p3wGNQeU0DK-
|
| 12 |
HF_ACCELERATOR=cpu
|
| 13 |
HF_SPACE_DOCKER=1
|
| 14 |
KAGGLE_AUTO_BOOTSTRAP=0
|
| 15 |
+
KAPO_BOOTSTRAP_URL=https://drive.google.com/uc?export=download&id=1cTITRABqhuRUyCaHFRA8p3wGNQeU0DK-
|
| 16 |
KAPO_COMPUTE_PROFILE=cpu
|
| 17 |
KAPO_DISABLE_EMBEDDINGS=1
|
| 18 |
KAPO_HF_INFERENCE_API=0
|
| 19 |
KAPO_HF_TRANSFORMERS_RUNTIME=1
|
| 20 |
KAPO_LAZY_EMBED_STARTUP=1
|
| 21 |
KAPO_LAZY_MODEL_STARTUP=1
|
| 22 |
+
KAPO_PATCH_BUNDLE_URL=https://drive.google.com/uc?export=download&id=1be4XGzTO4qm-V3HNuMKZNXD_3Ws-iF9H
|
| 23 |
+
KAPO_PATCH_MANIFEST_URL=https://drive.google.com/uc?export=download&id=1vt8VQ034HjoCzC5SBZcDNK4mclZJzKjv
|
| 24 |
+
KAPO_REMOTE_ENV_PASSWORD_B64=UTBkdEM5R1FxYXRScEp3S3U5dkhMUWtQaC1IY0NjSm8
|
| 25 |
+
KAPO_REMOTE_ENV_URL_B64=aHR0cHM6Ly9kcml2ZS5nb29nbGUuY29tL3VjP2V4cG9ydD1kb3dubG9hZCZpZD0xNUw5UXAzS3E0ZTZ5RVg4VHlFLVRZMks0ZHJnMWhCUEc
|
| 26 |
KAPO_SHARED_STATE_BACKEND=google_drive
|
| 27 |
MODEL_PROFILE_ID=hf-debugger-qwen25-7b-instruct
|
| 28 |
MODEL_REPO=Qwen/Qwen2.5-1.5B-Instruct
|
bootstrap_space_runtime.py
CHANGED
|
@@ -16,21 +16,21 @@ DEFAULT_ENV = {
|
|
| 16 |
"BRAIN_TEMPLATE": "hf-space-cpu",
|
| 17 |
"BRAIN_TUNNEL_PROVIDER": "none",
|
| 18 |
"FIREBASE_ENABLED": "0",
|
| 19 |
-
"GOOGLE_DRIVE_BOOTSTRAP_URL": "https://drive.google.com/uc?export=download&id=
|
| 20 |
"HF_ACCELERATOR": "cpu",
|
| 21 |
"HF_SPACE_DOCKER": "1",
|
| 22 |
"KAGGLE_AUTO_BOOTSTRAP": "0",
|
| 23 |
-
"KAPO_BOOTSTRAP_URL": "https://drive.google.com/uc?export=download&id=
|
| 24 |
"KAPO_COMPUTE_PROFILE": "cpu",
|
| 25 |
"KAPO_DISABLE_EMBEDDINGS": "1",
|
| 26 |
"KAPO_HF_INFERENCE_API": "0",
|
| 27 |
"KAPO_HF_TRANSFORMERS_RUNTIME": "1",
|
| 28 |
"KAPO_LAZY_EMBED_STARTUP": "1",
|
| 29 |
"KAPO_LAZY_MODEL_STARTUP": "1",
|
| 30 |
-
"KAPO_PATCH_BUNDLE_URL": "https://drive.google.com/uc?export=download&id=
|
| 31 |
-
"KAPO_PATCH_MANIFEST_URL": "https://drive.google.com/uc?export=download&id=
|
| 32 |
-
"KAPO_REMOTE_ENV_PASSWORD_B64": "
|
| 33 |
-
"KAPO_REMOTE_ENV_URL_B64": "
|
| 34 |
"KAPO_SHARED_STATE_BACKEND": "google_drive",
|
| 35 |
"MODEL_PROFILE_ID": "hf-debugger-qwen25-7b-instruct",
|
| 36 |
"MODEL_REPO": "Qwen/Qwen2.5-1.5B-Instruct",
|
|
|
|
| 16 |
"BRAIN_TEMPLATE": "hf-space-cpu",
|
| 17 |
"BRAIN_TUNNEL_PROVIDER": "none",
|
| 18 |
"FIREBASE_ENABLED": "0",
|
| 19 |
+
"GOOGLE_DRIVE_BOOTSTRAP_URL": "https://drive.google.com/uc?export=download&id=1cTITRABqhuRUyCaHFRA8p3wGNQeU0DK-",
|
| 20 |
"HF_ACCELERATOR": "cpu",
|
| 21 |
"HF_SPACE_DOCKER": "1",
|
| 22 |
"KAGGLE_AUTO_BOOTSTRAP": "0",
|
| 23 |
+
"KAPO_BOOTSTRAP_URL": "https://drive.google.com/uc?export=download&id=1cTITRABqhuRUyCaHFRA8p3wGNQeU0DK-",
|
| 24 |
"KAPO_COMPUTE_PROFILE": "cpu",
|
| 25 |
"KAPO_DISABLE_EMBEDDINGS": "1",
|
| 26 |
"KAPO_HF_INFERENCE_API": "0",
|
| 27 |
"KAPO_HF_TRANSFORMERS_RUNTIME": "1",
|
| 28 |
"KAPO_LAZY_EMBED_STARTUP": "1",
|
| 29 |
"KAPO_LAZY_MODEL_STARTUP": "1",
|
| 30 |
+
"KAPO_PATCH_BUNDLE_URL": "https://drive.google.com/uc?export=download&id=1be4XGzTO4qm-V3HNuMKZNXD_3Ws-iF9H",
|
| 31 |
+
"KAPO_PATCH_MANIFEST_URL": "https://drive.google.com/uc?export=download&id=1vt8VQ034HjoCzC5SBZcDNK4mclZJzKjv",
|
| 32 |
+
"KAPO_REMOTE_ENV_PASSWORD_B64": "UTBkdEM5R1FxYXRScEp3S3U5dkhMUWtQaC1IY0NjSm8",
|
| 33 |
+
"KAPO_REMOTE_ENV_URL_B64": "aHR0cHM6Ly9kcml2ZS5nb29nbGUuY29tL3VjP2V4cG9ydD1kb3dubG9hZCZpZD0xNUw5UXAzS3E0ZTZ5RVg4VHlFLVRZMks0ZHJnMWhCUEc",
|
| 34 |
"KAPO_SHARED_STATE_BACKEND": "google_drive",
|
| 35 |
"MODEL_PROFILE_ID": "hf-debugger-qwen25-7b-instruct",
|
| 36 |
"MODEL_REPO": "Qwen/Qwen2.5-1.5B-Instruct",
|
brain_server/api/main.py
CHANGED
|
@@ -287,6 +287,9 @@ def _load_default_model() -> None:
|
|
| 287 |
if _hf_transformers_runtime_enabled():
|
| 288 |
ensure_model_loaded(repo_id, filename, hf_token=os.getenv("HF_TOKEN"))
|
| 289 |
return
|
|
|
|
|
|
|
|
|
|
| 290 |
if not filename and (_feature_enabled("KAPO_HF_INFERENCE_API", default=False) or "huggingface" in provider or "hf-space" in provider):
|
| 291 |
MODEL = None
|
| 292 |
MODEL_ERROR = None
|
|
@@ -2314,7 +2317,7 @@ def ensure_model_loaded(repo_id: str, filename: str, hf_token: str | None = None
|
|
| 2314 |
MODEL = None
|
| 2315 |
MODEL_ERROR = 'model repo missing'
|
| 2316 |
return
|
| 2317 |
-
if _kapo_hf_transformers_enabled():
|
| 2318 |
try:
|
| 2319 |
from transformers import AutoModelForCausalLM, AutoTokenizer
|
| 2320 |
tokenizer = AutoTokenizer.from_pretrained(repo_id, token=hf_token, trust_remote_code=True)
|
|
|
|
| 287 |
if _hf_transformers_runtime_enabled():
|
| 288 |
ensure_model_loaded(repo_id, filename, hf_token=os.getenv("HF_TOKEN"))
|
| 289 |
return
|
| 290 |
+
if not filename and ("huggingface" in provider or "hf-space" in provider):
|
| 291 |
+
ensure_model_loaded(repo_id, filename, hf_token=os.getenv("HF_TOKEN"))
|
| 292 |
+
return
|
| 293 |
if not filename and (_feature_enabled("KAPO_HF_INFERENCE_API", default=False) or "huggingface" in provider or "hf-space" in provider):
|
| 294 |
MODEL = None
|
| 295 |
MODEL_ERROR = None
|
|
|
|
| 2317 |
MODEL = None
|
| 2318 |
MODEL_ERROR = 'model repo missing'
|
| 2319 |
return
|
| 2320 |
+
if _kapo_hf_transformers_enabled() or (_is_hf_space_runtime() and not filename):
|
| 2321 |
try:
|
| 2322 |
from transformers import AutoModelForCausalLM, AutoTokenizer
|
| 2323 |
tokenizer = AutoTokenizer.from_pretrained(repo_id, token=hf_token, trust_remote_code=True)
|
kapo.env
CHANGED
|
@@ -8,21 +8,21 @@ BRAIN_ROLES=debugger,fallback
|
|
| 8 |
BRAIN_TEMPLATE=hf-space-cpu
|
| 9 |
BRAIN_TUNNEL_PROVIDER=none
|
| 10 |
FIREBASE_ENABLED=0
|
| 11 |
-
GOOGLE_DRIVE_BOOTSTRAP_URL=https://drive.google.com/uc?export=download&id=
|
| 12 |
HF_ACCELERATOR=cpu
|
| 13 |
HF_SPACE_DOCKER=1
|
| 14 |
KAGGLE_AUTO_BOOTSTRAP=0
|
| 15 |
-
KAPO_BOOTSTRAP_URL=https://drive.google.com/uc?export=download&id=
|
| 16 |
KAPO_COMPUTE_PROFILE=cpu
|
| 17 |
KAPO_DISABLE_EMBEDDINGS=1
|
| 18 |
KAPO_HF_INFERENCE_API=0
|
| 19 |
KAPO_HF_TRANSFORMERS_RUNTIME=1
|
| 20 |
KAPO_LAZY_EMBED_STARTUP=1
|
| 21 |
KAPO_LAZY_MODEL_STARTUP=1
|
| 22 |
-
KAPO_PATCH_BUNDLE_URL=https://drive.google.com/uc?export=download&id=
|
| 23 |
-
KAPO_PATCH_MANIFEST_URL=https://drive.google.com/uc?export=download&id=
|
| 24 |
-
KAPO_REMOTE_ENV_PASSWORD_B64=
|
| 25 |
-
KAPO_REMOTE_ENV_URL_B64=
|
| 26 |
KAPO_SHARED_STATE_BACKEND=google_drive
|
| 27 |
MODEL_PROFILE_ID=hf-debugger-qwen25-7b-instruct
|
| 28 |
MODEL_REPO=Qwen/Qwen2.5-1.5B-Instruct
|
|
|
|
| 8 |
BRAIN_TEMPLATE=hf-space-cpu
|
| 9 |
BRAIN_TUNNEL_PROVIDER=none
|
| 10 |
FIREBASE_ENABLED=0
|
| 11 |
+
GOOGLE_DRIVE_BOOTSTRAP_URL=https://drive.google.com/uc?export=download&id=1cTITRABqhuRUyCaHFRA8p3wGNQeU0DK-
|
| 12 |
HF_ACCELERATOR=cpu
|
| 13 |
HF_SPACE_DOCKER=1
|
| 14 |
KAGGLE_AUTO_BOOTSTRAP=0
|
| 15 |
+
KAPO_BOOTSTRAP_URL=https://drive.google.com/uc?export=download&id=1cTITRABqhuRUyCaHFRA8p3wGNQeU0DK-
|
| 16 |
KAPO_COMPUTE_PROFILE=cpu
|
| 17 |
KAPO_DISABLE_EMBEDDINGS=1
|
| 18 |
KAPO_HF_INFERENCE_API=0
|
| 19 |
KAPO_HF_TRANSFORMERS_RUNTIME=1
|
| 20 |
KAPO_LAZY_EMBED_STARTUP=1
|
| 21 |
KAPO_LAZY_MODEL_STARTUP=1
|
| 22 |
+
KAPO_PATCH_BUNDLE_URL=https://drive.google.com/uc?export=download&id=1be4XGzTO4qm-V3HNuMKZNXD_3Ws-iF9H
|
| 23 |
+
KAPO_PATCH_MANIFEST_URL=https://drive.google.com/uc?export=download&id=1vt8VQ034HjoCzC5SBZcDNK4mclZJzKjv
|
| 24 |
+
KAPO_REMOTE_ENV_PASSWORD_B64=UTBkdEM5R1FxYXRScEp3S3U5dkhMUWtQaC1IY0NjSm8
|
| 25 |
+
KAPO_REMOTE_ENV_URL_B64=aHR0cHM6Ly9kcml2ZS5nb29nbGUuY29tL3VjP2V4cG9ydD1kb3dubG9hZCZpZD0xNUw5UXAzS3E0ZTZ5RVg4VHlFLVRZMks0ZHJnMWhCUEc
|
| 26 |
KAPO_SHARED_STATE_BACKEND=google_drive
|
| 27 |
MODEL_PROFILE_ID=hf-debugger-qwen25-7b-instruct
|
| 28 |
MODEL_REPO=Qwen/Qwen2.5-1.5B-Instruct
|