Spaces:

Ramkan7
/

Patch_Hawk

Running

Patch_Hawk / .env.example

Revised Flow

72bc633 about 2 months ago

1.38 kB

	# PatchHawk Environment Configuration
	# Template of the environment variables this project is configured with.
	# Copy this file to .env and fill in your real values.
	# Entries containing "your_..._here" / "your-username" are placeholders and
	# must be replaced; the remaining values are ready-to-use defaults.
	# Keep the filled-in .env out of version control — it will hold secrets.

	# ── Models ────────────────────────────────────────────────────────
	# Model for synthetic data generation (Meta SDK Track A).
	# The value is written as an "organization/model-name" identifier.
	SYNTH_GENERATOR_MODEL=meta-llama/Llama-3.2-3B-Instruct

	# Base policy model for GRPO training (same "organization/model-name" form).
	GRPO_POLICY_MODEL=unsloth/Qwen2.5-Coder-7B-Instruct

	# ── Weights & Biases ─────────────────────────────────────────────
	# Secret API key — placeholder, replace with your own key.
	WANDB_API_KEY=your_wandb_api_key_here
	# Presumably the W&B project and run name used for logging training runs;
	# NOTE(review): confirm against the training code that reads these.
	WANDB_PROJECT=patchhawk
	WANDB_RUN_NAME=grpo-run-1

	# ── Hugging Face Hub ─────────────────────────────────────────────
	# Secret access token — placeholder, replace with your own token.
	HF_TOKEN=your_hf_token_here
	# Hub repository in "username/repo" form — replace "your-username".
	# NOTE(review): presumably the upload target, which would require a token
	# with write access — confirm against the code that reads HF_REPO.
	HF_REPO=your-username/patchhawk

	# ── Docker ────────────────────────────────────────────────────────
	# Docker image reference in "name:tag" form.
	# NOTE(review): the name suggests a sandbox image that has to be available
	# locally — confirm how and where it is built.
	DOCKER_IMAGE=patchhawk-sandbox:latest

	# ── vLLM (Track A SDK) ──────────────────────────────────────────
	# Base URL of the vLLM HTTP API; the default targets a server on this
	# machine, port 8000, under the /v1 path prefix.
	# NOTE(review): presumably an OpenAI-compatible endpoint — confirm.
	VLLM_API_BASE=http://localhost:8000/v1