programasweights
/

paw-4b-gpt2

Text Generation

program-as-weights

Model card Files Files and versions

paw-4b-gpt2 / meta.json

yuntian-deng's picture

Upload folder using huggingface_hub

60f07dd verified 1 day ago

history blame contribute delete

601 Bytes

	{
	"opt_step": 210751,
	"timestamp": 1775400448.2125497,
	"compiler_model": "train_runs/big_run_gpt2.latest/compiler",
	"interpreter_model": "gpt2",
	"freeze_interpreter": true,
	"freeze_compiler": true,
	"reward_type": "gt_logprob",
	"prefix_steps": 64,
	"prefix_loss_coef": 1.0,
	"compiler_rollout_reg_coef": 0.0,
	"compiler_prompt_style": "minimal",
	"num_rollouts": 1,
	"debug_overfit_one": false,
	"debug_example_idx": 0,
	"debug_overfit_n": 0,
	"lora_rank": 64,
	"lora_alpha": 16.0,
	"lora_target_modules": [
	"c_attn",
	"c_proj",
	"c_fc"
	],
	"lora_num_bases": 64
	}