{ "project": "CyberCoder-7B-v1", "description": "Cybersecurity-focused code model with structured JSON output", "architecture_decisions": { "base_model": { "choice": "Qwen/Qwen2.5-Coder-7B-Instruct", "rationale": "SOTA open code model at 7B scale. Strong on HumanEval, MBPP, LiveCodeBench. Apache 2.0 license." }, "training_method": { "choice": "SFT with LoRA (r=64, alpha=128)", "rationale": "CyberPal 2.0 recipe. LoRA allows training on single A10G/A100.", "hyperparameters": { "learning_rate": 4e-5, "warmup_ratio": 0.15, "num_epochs": 2, "max_seq_length": 4096, "batch_size_effective": 16, "optimizer": "AdamW", "scheduler": "cosine" } } }, "scaling_roadmap": { "phase_1": "7B LoRA SFT (current) - $4-16, 2-4hrs on A10G", "phase_2": "7B full SFT with 200K+ examples - $32-64, 12-24hrs on A100", "phase_3": "32B LoRA SFT - $192-768, 24-48hrs on 8xA100", "phase_4": "100B+ sparse MoE (frontier) - $5-50M, 2-4 months on 1000+ H100s" }, "research_references": [ {"paper": "CyberPal 2.0", "arxiv": "2510.14113"}, {"paper": "Foundation-Sec-8B", "arxiv": "2504.21039"}, {"paper": "SWE-Master", "arxiv": "2602.03411"}, {"paper": "RL-Struct (JSON output)", "arxiv": "2512.00319"}, {"paper": "DeepSeek-V3", "arxiv": "2412.19437"} ] }