Buckets:

bbkdevops
/

unicosys-hypergraph-bucket

Files

xet

bbkdevops/unicosys-hypergraph-bucket / tinymind-native-8b-remote-handoff /bundle /evaluation /resource_optimizer.py

bbkdevops

about 1 month ago

download

raw

4.24 kB

	"""Quality-per-resource optimizer for TinyMind."""

	from __future__ import annotations

	from datetime import datetime, timezone
	import json
	from pathlib import Path


	def _load(path: str \| Path) -> dict:
	return json.loads(Path(path).read_text(encoding="utf-8"))


	def _artifact_mb(path: str \| Path \| None) -> float:
	if not path:
	return 0.0
	p = Path(path)
	return p.stat().st_size / (1024 * 1024) if p.exists() else 0.0


	def score_quality_per_resource(loss: float, bit_error: float, size_mb: float, vram_gb: float) -> float:
	quality = 1.0 / (1.0 + max(loss, 0.0))
	exactness = 1.0 - min(max(bit_error, 0.0), 1.0)
	resource_penalty = 1.0 + (size_mb / 1024.0) + (vram_gb / 24.0)
	return (0.65 * quality + 0.35 * exactness) / resource_penalty


	def build_resource_optimizer_report(
	out_dir: str \| Path,
	bitsharp_report: str \| Path,
	preflight_4b: str \| Path,
	) -> dict:
	bit = _load(bitsharp_report)
	pre = _load(preflight_4b)
	checkpoint = bit.get("checkpoint")
	int4_candidate = "reports/knowledge_full_cycle_sharpen_256_stratified/train_eval/purefield_int4_sparse.pt"
	candidates = [
	{
	"name": "bitsharp_bf16_quality",
	"checkpoint": checkpoint,
	"loss": bit["after"]["loss"],
	"bit_error_proxy": bit["after"]["bit_error_proxy"],
	"size_mb": _artifact_mb(checkpoint),
	"estimated_vram_gb": pre["purefield_vram"]["bf16_weights_gb"],
	"mode": "bf16_or_fp32_checkpoint_quality",
	"training_profile": "microbatch_1_to_2_gradient_checkpointing_bitsharp",
	},
	{
	"name": "int4_sparse_fast_adapter",
	"checkpoint": int4_candidate,
	"loss": bit["after"]["loss"] + 0.05,
	"bit_error_proxy": min(bit["after"]["bit_error_proxy"] + 0.02, 1.0),
	"size_mb": _artifact_mb(int4_candidate),
	"estimated_vram_gb": pre["purefield_vram"]["int4_raw_weights_gb"],
	"mode": "int4_2:4sp_fast",
	"training_profile": "adapter_only_or_bitsharp_delta_then_export_int4",
	},
	]
	for row in candidates:
	row["quality_per_resource_score"] = score_quality_per_resource(
	row["loss"], row["bit_error_proxy"], row["size_mb"], row["estimated_vram_gb"]
	)
	selected = max(candidates, key=lambda row: row["quality_per_resource_score"])
	report = {
	"schema_version": "tinymind-resource-optimizer-v1",
	"created_at": datetime.now(timezone.utc).isoformat(),
	"goal": "maximize measured quality/exactness while minimizing VRAM and artifact size",
	"hardware_target": "RTX 3090 24GB",
	"selected": selected,
	"candidates": candidates,
	"recommended_runtime": {
	"precision_mode": "auto",
	"prefer_int4_sparse_when_quality_gate_passes": True,
	"gradient_checkpointing": True,
	"microbatch": 1,
	"accumulate_grad_batches": 16,
	"train_method": "BitSharp/adapters over PureField/ReGenesis, not full dense 4B Adam",
	},
	"world_best_claim_allowed": False,
	}
	out = Path(out_dir)
	out.mkdir(parents=True, exist_ok=True)
	path = out / "resource_optimizer_report.json"
	md_path = out / "resource_optimizer_report.md"
	report["report_path"] = str(path)
	report["markdown_path"] = str(md_path)
	path.write_text(json.dumps(report, ensure_ascii=False, indent=2, sort_keys=True), encoding="utf-8")
	md_path.write_text(_markdown(report), encoding="utf-8")
	return report


	def _markdown(report: dict) -> str:
	selected = report["selected"]
	lines = [
	"# TinyMind Resource Optimizer",
	"",
	f"- Selected: {selected['name']}",
	f"- Score: {selected['quality_per_resource_score']:.6f}",
	f"- Mode: {selected['mode']}",
	f"- Estimated VRAM GB: {selected['estimated_vram_gb']:.4f}",
	f"- Size MB: {selected['size_mb']:.4f}",
	"- World-best claim allowed: false",
	"",
	"## Recommended Runtime",
	"",
	]
	for key, value in report["recommended_runtime"].items():
	lines.append(f"- {key}: {value}")
	return "\n".join(lines) + "\n"

Xet Storage Details

Size:: 4.24 kB
Xet hash:: 68a73c6ecef7328862c5645ec2cfaa861883d890e2da9239c2d26b04560acee0

Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.