MrA7A3 committed on
Commit
dc4901c
·
verified ·
1 Parent(s): 2346083

KAPO hf runtime finalizer

Browse files
Files changed (4) hide show
  1. .env +6 -6
  2. bootstrap_space_runtime.py +6 -6
  3. brain_server/api/main.py +4 -1
  4. kapo.env +6 -6
.env CHANGED
@@ -8,21 +8,21 @@ BRAIN_ROLES=debugger,fallback
8
  BRAIN_TEMPLATE=hf-space-cpu
9
  BRAIN_TUNNEL_PROVIDER=none
10
  FIREBASE_ENABLED=0
11
- GOOGLE_DRIVE_BOOTSTRAP_URL=https://drive.google.com/uc?export=download&id=19jyBWsQ9ciJVPi2PUigu5ti3gJ24A6TG
12
  HF_ACCELERATOR=cpu
13
  HF_SPACE_DOCKER=1
14
  KAGGLE_AUTO_BOOTSTRAP=0
15
- KAPO_BOOTSTRAP_URL=https://drive.google.com/uc?export=download&id=19jyBWsQ9ciJVPi2PUigu5ti3gJ24A6TG
16
  KAPO_COMPUTE_PROFILE=cpu
17
  KAPO_DISABLE_EMBEDDINGS=1
18
  KAPO_HF_INFERENCE_API=0
19
  KAPO_HF_TRANSFORMERS_RUNTIME=1
20
  KAPO_LAZY_EMBED_STARTUP=1
21
  KAPO_LAZY_MODEL_STARTUP=1
22
- KAPO_PATCH_BUNDLE_URL=https://drive.google.com/uc?export=download&id=1dj3gorVxheXtEjDqydavLkN-qtEJz158
23
- KAPO_PATCH_MANIFEST_URL=https://drive.google.com/uc?export=download&id=1dD1YCMloO4bRruWO4r0QJaMxfIsRDyNb
24
- KAPO_REMOTE_ENV_PASSWORD_B64=SGhwOW1BdWt1UFNyd1pYTlJPckFHZjA2ZVVJTXZYTmo
25
- KAPO_REMOTE_ENV_URL_B64=aHR0cHM6Ly9kcml2ZS5nb29nbGUuY29tL3VjP2V4cG9ydD1kb3dubG9hZCZpZD0xdFI4XzdxVTFxNDBnWjBpS1BRWXFPemtGRmlJeWFOQ0U
26
  KAPO_SHARED_STATE_BACKEND=google_drive
27
  MODEL_PROFILE_ID=hf-debugger-qwen25-7b-instruct
28
  MODEL_REPO=Qwen/Qwen2.5-1.5B-Instruct
 
8
  BRAIN_TEMPLATE=hf-space-cpu
9
  BRAIN_TUNNEL_PROVIDER=none
10
  FIREBASE_ENABLED=0
11
+ GOOGLE_DRIVE_BOOTSTRAP_URL=https://drive.google.com/uc?export=download&id=1cTITRABqhuRUyCaHFRA8p3wGNQeU0DK-
12
  HF_ACCELERATOR=cpu
13
  HF_SPACE_DOCKER=1
14
  KAGGLE_AUTO_BOOTSTRAP=0
15
+ KAPO_BOOTSTRAP_URL=https://drive.google.com/uc?export=download&id=1cTITRABqhuRUyCaHFRA8p3wGNQeU0DK-
16
  KAPO_COMPUTE_PROFILE=cpu
17
  KAPO_DISABLE_EMBEDDINGS=1
18
  KAPO_HF_INFERENCE_API=0
19
  KAPO_HF_TRANSFORMERS_RUNTIME=1
20
  KAPO_LAZY_EMBED_STARTUP=1
21
  KAPO_LAZY_MODEL_STARTUP=1
22
+ KAPO_PATCH_BUNDLE_URL=https://drive.google.com/uc?export=download&id=1be4XGzTO4qm-V3HNuMKZNXD_3Ws-iF9H
23
+ KAPO_PATCH_MANIFEST_URL=https://drive.google.com/uc?export=download&id=1vt8VQ034HjoCzC5SBZcDNK4mclZJzKjv
24
+ KAPO_REMOTE_ENV_PASSWORD_B64=UTBkdEM5R1FxYXRScEp3S3U5dkhMUWtQaC1IY0NjSm8
25
+ KAPO_REMOTE_ENV_URL_B64=aHR0cHM6Ly9kcml2ZS5nb29nbGUuY29tL3VjP2V4cG9ydD1kb3dubG9hZCZpZD0xNUw5UXAzS3E0ZTZ5RVg4VHlFLVRZMks0ZHJnMWhCUEc
26
  KAPO_SHARED_STATE_BACKEND=google_drive
27
  MODEL_PROFILE_ID=hf-debugger-qwen25-7b-instruct
28
  MODEL_REPO=Qwen/Qwen2.5-1.5B-Instruct
bootstrap_space_runtime.py CHANGED
@@ -16,21 +16,21 @@ DEFAULT_ENV = {
16
  "BRAIN_TEMPLATE": "hf-space-cpu",
17
  "BRAIN_TUNNEL_PROVIDER": "none",
18
  "FIREBASE_ENABLED": "0",
19
- "GOOGLE_DRIVE_BOOTSTRAP_URL": "https://drive.google.com/uc?export=download&id=19jyBWsQ9ciJVPi2PUigu5ti3gJ24A6TG",
20
  "HF_ACCELERATOR": "cpu",
21
  "HF_SPACE_DOCKER": "1",
22
  "KAGGLE_AUTO_BOOTSTRAP": "0",
23
- "KAPO_BOOTSTRAP_URL": "https://drive.google.com/uc?export=download&id=19jyBWsQ9ciJVPi2PUigu5ti3gJ24A6TG",
24
  "KAPO_COMPUTE_PROFILE": "cpu",
25
  "KAPO_DISABLE_EMBEDDINGS": "1",
26
  "KAPO_HF_INFERENCE_API": "0",
27
  "KAPO_HF_TRANSFORMERS_RUNTIME": "1",
28
  "KAPO_LAZY_EMBED_STARTUP": "1",
29
  "KAPO_LAZY_MODEL_STARTUP": "1",
30
- "KAPO_PATCH_BUNDLE_URL": "https://drive.google.com/uc?export=download&id=1dj3gorVxheXtEjDqydavLkN-qtEJz158",
31
- "KAPO_PATCH_MANIFEST_URL": "https://drive.google.com/uc?export=download&id=1dD1YCMloO4bRruWO4r0QJaMxfIsRDyNb",
32
- "KAPO_REMOTE_ENV_PASSWORD_B64": "SGhwOW1BdWt1UFNyd1pYTlJPckFHZjA2ZVVJTXZYTmo",
33
- "KAPO_REMOTE_ENV_URL_B64": "aHR0cHM6Ly9kcml2ZS5nb29nbGUuY29tL3VjP2V4cG9ydD1kb3dubG9hZCZpZD0xdFI4XzdxVTFxNDBnWjBpS1BRWXFPemtGRmlJeWFOQ0U",
34
  "KAPO_SHARED_STATE_BACKEND": "google_drive",
35
  "MODEL_PROFILE_ID": "hf-debugger-qwen25-7b-instruct",
36
  "MODEL_REPO": "Qwen/Qwen2.5-1.5B-Instruct",
 
16
  "BRAIN_TEMPLATE": "hf-space-cpu",
17
  "BRAIN_TUNNEL_PROVIDER": "none",
18
  "FIREBASE_ENABLED": "0",
19
+ "GOOGLE_DRIVE_BOOTSTRAP_URL": "https://drive.google.com/uc?export=download&id=1cTITRABqhuRUyCaHFRA8p3wGNQeU0DK-",
20
  "HF_ACCELERATOR": "cpu",
21
  "HF_SPACE_DOCKER": "1",
22
  "KAGGLE_AUTO_BOOTSTRAP": "0",
23
+ "KAPO_BOOTSTRAP_URL": "https://drive.google.com/uc?export=download&id=1cTITRABqhuRUyCaHFRA8p3wGNQeU0DK-",
24
  "KAPO_COMPUTE_PROFILE": "cpu",
25
  "KAPO_DISABLE_EMBEDDINGS": "1",
26
  "KAPO_HF_INFERENCE_API": "0",
27
  "KAPO_HF_TRANSFORMERS_RUNTIME": "1",
28
  "KAPO_LAZY_EMBED_STARTUP": "1",
29
  "KAPO_LAZY_MODEL_STARTUP": "1",
30
+ "KAPO_PATCH_BUNDLE_URL": "https://drive.google.com/uc?export=download&id=1be4XGzTO4qm-V3HNuMKZNXD_3Ws-iF9H",
31
+ "KAPO_PATCH_MANIFEST_URL": "https://drive.google.com/uc?export=download&id=1vt8VQ034HjoCzC5SBZcDNK4mclZJzKjv",
32
+ "KAPO_REMOTE_ENV_PASSWORD_B64": "UTBkdEM5R1FxYXRScEp3S3U5dkhMUWtQaC1IY0NjSm8",
33
+ "KAPO_REMOTE_ENV_URL_B64": "aHR0cHM6Ly9kcml2ZS5nb29nbGUuY29tL3VjP2V4cG9ydD1kb3dubG9hZCZpZD0xNUw5UXAzS3E0ZTZ5RVg4VHlFLVRZMks0ZHJnMWhCUEc",
34
  "KAPO_SHARED_STATE_BACKEND": "google_drive",
35
  "MODEL_PROFILE_ID": "hf-debugger-qwen25-7b-instruct",
36
  "MODEL_REPO": "Qwen/Qwen2.5-1.5B-Instruct",
brain_server/api/main.py CHANGED
@@ -287,6 +287,9 @@ def _load_default_model() -> None:
287
  if _hf_transformers_runtime_enabled():
288
  ensure_model_loaded(repo_id, filename, hf_token=os.getenv("HF_TOKEN"))
289
  return
 
 
 
290
  if not filename and (_feature_enabled("KAPO_HF_INFERENCE_API", default=False) or "huggingface" in provider or "hf-space" in provider):
291
  MODEL = None
292
  MODEL_ERROR = None
@@ -2314,7 +2317,7 @@ def ensure_model_loaded(repo_id: str, filename: str, hf_token: str | None = None
2314
  MODEL = None
2315
  MODEL_ERROR = 'model repo missing'
2316
  return
2317
- if _kapo_hf_transformers_enabled():
2318
  try:
2319
  from transformers import AutoModelForCausalLM, AutoTokenizer
2320
  tokenizer = AutoTokenizer.from_pretrained(repo_id, token=hf_token, trust_remote_code=True)
 
287
  if _hf_transformers_runtime_enabled():
288
  ensure_model_loaded(repo_id, filename, hf_token=os.getenv("HF_TOKEN"))
289
  return
290
+ if not filename and ("huggingface" in provider or "hf-space" in provider):
291
+ ensure_model_loaded(repo_id, filename, hf_token=os.getenv("HF_TOKEN"))
292
+ return
293
  if not filename and (_feature_enabled("KAPO_HF_INFERENCE_API", default=False) or "huggingface" in provider or "hf-space" in provider):
294
  MODEL = None
295
  MODEL_ERROR = None
 
2317
  MODEL = None
2318
  MODEL_ERROR = 'model repo missing'
2319
  return
2320
+ if _kapo_hf_transformers_enabled() or (_is_hf_space_runtime() and not filename):
2321
  try:
2322
  from transformers import AutoModelForCausalLM, AutoTokenizer
2323
  tokenizer = AutoTokenizer.from_pretrained(repo_id, token=hf_token, trust_remote_code=True)
kapo.env CHANGED
@@ -8,21 +8,21 @@ BRAIN_ROLES=debugger,fallback
8
  BRAIN_TEMPLATE=hf-space-cpu
9
  BRAIN_TUNNEL_PROVIDER=none
10
  FIREBASE_ENABLED=0
11
- GOOGLE_DRIVE_BOOTSTRAP_URL=https://drive.google.com/uc?export=download&id=19jyBWsQ9ciJVPi2PUigu5ti3gJ24A6TG
12
  HF_ACCELERATOR=cpu
13
  HF_SPACE_DOCKER=1
14
  KAGGLE_AUTO_BOOTSTRAP=0
15
- KAPO_BOOTSTRAP_URL=https://drive.google.com/uc?export=download&id=19jyBWsQ9ciJVPi2PUigu5ti3gJ24A6TG
16
  KAPO_COMPUTE_PROFILE=cpu
17
  KAPO_DISABLE_EMBEDDINGS=1
18
  KAPO_HF_INFERENCE_API=0
19
  KAPO_HF_TRANSFORMERS_RUNTIME=1
20
  KAPO_LAZY_EMBED_STARTUP=1
21
  KAPO_LAZY_MODEL_STARTUP=1
22
- KAPO_PATCH_BUNDLE_URL=https://drive.google.com/uc?export=download&id=1dj3gorVxheXtEjDqydavLkN-qtEJz158
23
- KAPO_PATCH_MANIFEST_URL=https://drive.google.com/uc?export=download&id=1dD1YCMloO4bRruWO4r0QJaMxfIsRDyNb
24
- KAPO_REMOTE_ENV_PASSWORD_B64=SGhwOW1BdWt1UFNyd1pYTlJPckFHZjA2ZVVJTXZYTmo
25
- KAPO_REMOTE_ENV_URL_B64=aHR0cHM6Ly9kcml2ZS5nb29nbGUuY29tL3VjP2V4cG9ydD1kb3dubG9hZCZpZD0xdFI4XzdxVTFxNDBnWjBpS1BRWXFPemtGRmlJeWFOQ0U
26
  KAPO_SHARED_STATE_BACKEND=google_drive
27
  MODEL_PROFILE_ID=hf-debugger-qwen25-7b-instruct
28
  MODEL_REPO=Qwen/Qwen2.5-1.5B-Instruct
 
8
  BRAIN_TEMPLATE=hf-space-cpu
9
  BRAIN_TUNNEL_PROVIDER=none
10
  FIREBASE_ENABLED=0
11
+ GOOGLE_DRIVE_BOOTSTRAP_URL=https://drive.google.com/uc?export=download&id=1cTITRABqhuRUyCaHFRA8p3wGNQeU0DK-
12
  HF_ACCELERATOR=cpu
13
  HF_SPACE_DOCKER=1
14
  KAGGLE_AUTO_BOOTSTRAP=0
15
+ KAPO_BOOTSTRAP_URL=https://drive.google.com/uc?export=download&id=1cTITRABqhuRUyCaHFRA8p3wGNQeU0DK-
16
  KAPO_COMPUTE_PROFILE=cpu
17
  KAPO_DISABLE_EMBEDDINGS=1
18
  KAPO_HF_INFERENCE_API=0
19
  KAPO_HF_TRANSFORMERS_RUNTIME=1
20
  KAPO_LAZY_EMBED_STARTUP=1
21
  KAPO_LAZY_MODEL_STARTUP=1
22
+ KAPO_PATCH_BUNDLE_URL=https://drive.google.com/uc?export=download&id=1be4XGzTO4qm-V3HNuMKZNXD_3Ws-iF9H
23
+ KAPO_PATCH_MANIFEST_URL=https://drive.google.com/uc?export=download&id=1vt8VQ034HjoCzC5SBZcDNK4mclZJzKjv
24
+ KAPO_REMOTE_ENV_PASSWORD_B64=UTBkdEM5R1FxYXRScEp3S3U5dkhMUWtQaC1IY0NjSm8
25
+ KAPO_REMOTE_ENV_URL_B64=aHR0cHM6Ly9kcml2ZS5nb29nbGUuY29tL3VjP2V4cG9ydD1kb3dubG9hZCZpZD0xNUw5UXAzS3E0ZTZ5RVg4VHlFLVRZMks0ZHJnMWhCUEc
26
  KAPO_SHARED_STATE_BACKEND=google_drive
27
  MODEL_PROFILE_ID=hf-debugger-qwen25-7b-instruct
28
  MODEL_REPO=Qwen/Qwen2.5-1.5B-Instruct