# bee/scripts/bootstrap_hf_repos.py
# Bee Deploy — HF Space backend deploy [de0cba5] (5e21013)
"""Create the 6 cuilabs/bee-* HF model repos with honest, auditable READMEs.
This is a one-shot bootstrap. Each repo:
- Is private at first (we toggle public when adapters are real and validated)
- Gets a README that states WHAT the repo represents and WHAT'S TRAINED today
- Does not pretend tiers without compute are "production-ready"
Mapping mirrors apps/workspace/src/lib/models/catalog.ts (`hf_repo` field):
bee-cell β†’ cuilabs/bee-cell (active β€” Kaggle T4 trains here)
bee-comb β†’ cuilabs/bee-comb (placeholder β€” same base, larger context)
bee-hive β†’ cuilabs/bee-hive (placeholder β€” 3B base, needs paid GPU)
bee-swarm β†’ cuilabs/bee-swarm (placeholder β€” 7B+ base, needs paid GPU)
bee-enclave β†’ cuilabs/bee-enclave (placeholder β€” deployment mode of Hive/Swarm)
bee-ignite β†’ cuilabs/bee-ignite (placeholder β€” experimental R&D track)
"""
from __future__ import annotations
import os
REPOS = [
{
"name": "cuilabs/bee-cell",
"tagline": "Private AI on your own machine.",
"tier": "Bee Cell β€” production tier 1",
"base_model": "HuggingFaceTB/SmolLM2-360M-Instruct",
"status": (
"**Active training.** This repo holds LoRA adapters trained on "
"the [`cuilabs/bee-interactions`](https://huggingface.co/datasets/cuilabs/bee-interactions) "
"dataset by the Kaggle notebook "
"[`ceocxx/bee-train-online`](https://www.kaggle.com/code/ceocxx/bee-train-online), "
"kicked daily by the Vercel cron at "
"`/api/cron/kaggle-dispatch` in the [Bee monorepo](https://github.com/cuilabs/bee). "
"Adapter branches are named `<domain>/<utc-timestamp>` "
"(e.g. `general/2026-04-28-1430`)."
),
},
{
"name": "cuilabs/bee-comb",
"tagline": "Workstation-grade AI for serious builders.",
"tier": "Bee Comb β€” production tier 2",
"base_model": "(TBD β€” same family as Cell, larger context)",
"status": (
"**Placeholder repo.** Bee Comb shares Cell's training pipeline "
"but with a wider context window and higher throughput targets. "
"No adapters trained yet β€” we are validating the Cell pipeline "
"first before scaling up. Once Cell adapters are demonstrably "
"useful, the same training script will fan out to Comb."
),
},
{
"name": "cuilabs/bee-hive",
"tagline": "Team-grade AI for startups and SMBs.",
"tier": "Bee Hive β€” production tier 3",
"base_model": "(TBD β€” 3B parameter class)",
"status": (
"**Placeholder repo.** Bee Hive is a 3B-class model. Kaggle's "
"free T4 cannot train 3B with LoRA at useful throughput; this "
"tier needs paid GPU (Modal, RunPod, Lambda, or HF Inference "
"Endpoints). No adapters trained yet β€” compute provisioning "
"pending. The `training_runs` Postgres table already supports "
"this tier via `model_id = 'bee-hive'`."
),
},
{
"name": "cuilabs/bee-swarm",
"tagline": "Enterprise-grade AI with quantum reasoning.",
"tier": "Bee Swarm β€” production tier 4",
"base_model": "(TBD β€” 7B+ parameter class)",
"status": (
"**Placeholder repo.** Bee Swarm is a 7B+ class model with "
"quantum-reasoning routing enabled. Requires H100-class compute. "
"No adapters trained yet β€” compute provisioning pending."
),
},
{
"name": "cuilabs/bee-enclave",
"tagline": "Private, auditable deployment of any Hive/Swarm workload.",
"tier": "Bee Enclave β€” deployment mode (not a separate model)",
"base_model": "(inherits Hive or Swarm weights at deploy time)",
"status": (
"**Placeholder repo / deployment artefact.** Bee Enclave is "
"**not** a separate model tier above Swarm; it is a deployment "
"*mode* that wraps Hive/Swarm-class capability inside a private, "
"auditable boundary (data residency, audit logs, tenant-specific "
"adapters, PQC transport). This repo will hold tenant-pinned "
"snapshots of Hive or Swarm adapters once those exist. Billed "
"per-deployment, not per-token."
),
},
{
"name": "cuilabs/bee-ignite",
"tagline": "Experimental Bee-native architecture.",
"tier": "Bee Ignite β€” research / R&D",
"base_model": "(experimental β€” Bee-native MoE + SSM + custom attention)",
"status": (
"**Placeholder repo / R&D track.** Bee Ignite is the experimental "
"Bee-native architecture (custom attention, SSM memory, MoE "
"routing, hierarchical neural compression). Research-only until "
"benchmark-validated. Hidden from public model menus by default. "
"No commercial availability."
),
},
]
def readme_for(r: dict[str, str]) -> str:
    """Render the README.md markdown for one repo spec from ``REPOS``.

    ``r`` must provide the keys ``name`` ("org/repo"), ``tagline``, ``tier``,
    ``base_model`` and ``status``; each is interpolated verbatim into the
    YAML-front-matter + markdown template below. The template body is kept
    flush-left on purpose: it is README content, not Python indentation.
    """
    return f"""---
license: other
language:
- en
library_name: peft
pipeline_tag: text-generation
tags:
- bee
- cuilabs
- lora
---
# {r["name"]}
**{r["tagline"]}**
{r["tier"]} — published by [CUI Labs Pte. Ltd.](https://www.cuilabs.io)
---
## What this repo holds
LoRA adapters for the **{r["name"].split("/")[1]}** tier of the Bee
Intelligence Engine. Base model: {r["base_model"]}.
{r["status"]}
## Branch convention
`<domain>/<utc-timestamp>`, e.g. `programming/2026-04-28-1430`. The
`main` branch may be empty until the first successful training run. To
load a specific domain adapter:
```python
from peft import PeftModel
from transformers import AutoModelForCausalLM, AutoTokenizer
base = AutoModelForCausalLM.from_pretrained("{r["base_model"]}", torch_dtype="auto")
tok = AutoTokenizer.from_pretrained("{r["base_model"]}")
model = PeftModel.from_pretrained(base, "{r["name"]}", revision="programming/2026-04-28-1430")
```
## Training transparency
Every adapter version corresponds to a row in the `training_runs`
Postgres table on [workspace.bee.cuilabs.io](https://workspace.bee.cuilabs.io)
with `model_id = "{r["name"].split("/")[1]}"`. Metrics are real loss
values from the actual run, not estimates. Status is one of
`completed`, `partial`, or `failed` — partial means the run finished
cleanly but had nothing to train on yet.
## License
Adapter weights: see [CUI Labs licensing](https://www.cuilabs.io). Base
model weights are governed by their respective upstream licenses.
"""
def main() -> None:
    """Create every Bee HF repo (private) and push its tier-honest README.

    Requires a write-capable ``HF_TOKEN`` in the environment. Each repo is
    handled independently: a failure is printed and the loop moves on, so
    one bad repo never blocks the rest of the bootstrap.
    """
    token = os.environ.get("HF_TOKEN")
    if not token:
        raise SystemExit("HF_TOKEN env var required")

    # Imported lazily so the cheap token check above runs (and fails fast)
    # before huggingface_hub has to be importable.
    from huggingface_hub import HfApi, create_repo  # type: ignore[import-not-found]

    api = HfApi(token=token)

    for spec in REPOS:
        repo_id = spec["name"]
        print(f"\n=== {spec['name']} ===")

        # Step 1: ensure the (private) repo exists; skip README on failure.
        try:
            create_repo(repo_id, repo_type="model", private=True,
                        exist_ok=True, token=token)
            print(" repo: ok (created or already existed)")
        except Exception as exc:
            print(f" repo: ERROR {exc!r}")
            continue

        # Step 2: render and upload the README for this tier.
        readme = readme_for(spec)
        try:
            api.upload_file(
                path_or_fileobj=readme.encode("utf-8"),
                path_in_repo="README.md",
                repo_id=repo_id,
                repo_type="model",
                commit_message="bootstrap: tier-honest README",
                token=token,
            )
            print(f" README: uploaded ({len(readme)} bytes)")
        except Exception as exc:
            print(f" README: ERROR {exc!r}")


if __name__ == "__main__":
    main()