ruhrpott
/

FB-Point-Mass-Maze-12M

Model card Files Files and versions

FB-Point-Mass-Maze-12M / checkpoint /config.json

ruhrpott's picture

Upload 4 files

fd53424 verified 6 months ago

history blame contribute delete

1.77 kB

	{
	"model": {
	"obs_dim": 4,
	"action_dim": 2,
	"device": "cuda",
	"archi": {
	"z_dim": 100,
	"norm_z": true,
	"f": {
	"hidden_dim": 1024,
	"model": "simple",
	"hidden_layers": 1,
	"embedding_layers": 2,
	"num_parallel": 2,
	"ensemble_mode": "batch"
	},
	"b": {
	"hidden_dim": 256,
	"hidden_layers": 2,
	"norm": true
	},
	"actor": {
	"hidden_dim": 1024,
	"model": "simple",
	"hidden_layers": 1,
	"embedding_layers": 2,
	"learn_std": false,
	"per_state_std": false,
	"squash": false
	},
	"critic": {
	"hidden_dim": 1024,
	"hidden_layers": 1,
	"embedding_layers": 2,
	"num_parallel": 2,
	"ensemble_mode": "batch"
	}
	},
	"inference_batch_size": 500000,
	"seq_length": 1,
	"actor_std": 0.2,
	"norm_obs": false
	},
	"train": {
	"lr_f": 0.0001,
	"lr_b": 1e-06,
	"lr_actor": 1e-06,
	"weight_decay": 0.0,
	"clip_grad_norm": 0.0,
	"fb_target_tau": 0.01,
	"ortho_coef": 1.0,
	"train_goal_ratio": 0.5,
	"fb_pessimism_penalty": 0.0,
	"actor_pessimism_penalty": 0.0,
	"stddev_clip": 0.3,
	"q_loss_coef": 0.0,
	"batch_size": 1024,
	"discount": 0.99,
	"update_z_every_step": 150,
	"z_buffer_size": 10000,
	"h_coef": 1.0
	},
	"cudagraphs": true,
	"compile": true
	}