jacobcd52
/

features_over_time

Model card Files Files and versions

features_over_time / trainer_0 /config.json

jacobcd52's picture

Upload trainer_0/config.json with huggingface_hub

ff79fea verified about 1 year ago

history blame contribute delete

839 Bytes

	{
	"trainer": {
	"trainer_class": "TopKTrainer",
	"dict_class": "AutoEncoderTopK",
	"lr": 0.000282842712474619,
	"steps": 61035,
	"auxk_alpha": 0.03125,
	"warmup_steps": 0,
	"decay_start": null,
	"threshold_beta": 0.999,
	"threshold_start_step": 1000,
	"seed": null,
	"activation_dim": 6144,
	"dict_size": 8192,
	"k": 128,
	"device": "cuda:0",
	"layer": 4,
	"lm_name": "blah",
	"wandb_name": "AutoEncoderTopK",
	"submodule_name": null
	},
	"buffer": {
	"n_models": 12,
	"d_submodule": 512,
	"io": "out",
	"n_ctxs": 1024,
	"ctx_len": 128,
	"refresh_batch_size": 512,
	"out_batch_size": 8192,
	"device": "cuda:0",
	"rescale_acts": true
	}
	}