bearlover365
/

multi_sac_smoke

Model card Files Files and versions

multi_sac_smoke / config.json

bearlover365's picture

Upload policy weights, train config and readme

2c061ce verified 5 months ago

history blame contribute delete

3.17 kB

	{
	"type": "sac",
	"n_obs_steps": 1,
	"normalization_mapping": {
	"VISUAL": "MEAN_STD",
	"STATE": "MIN_MAX",
	"ENV": "MIN_MAX",
	"ACTION": "MIN_MAX"
	},
	"input_features": {
	"observation.state": {
	"type": "STATE",
	"shape": [
	6
	]
	}
	},
	"output_features": {
	"action": {
	"type": "ACTION",
	"shape": [
	6
	]
	}
	},
	"device": "cpu",
	"use_amp": false,
	"push_to_hub": true,
	"repo_id": "bearlover365/multi_sac_smoke",
	"private": null,
	"tags": null,
	"license": null,
	"dataset_stats": {
	"observation.image": {
	"mean": [
	0.485,
	0.456,
	0.406
	],
	"std": [
	0.229,
	0.224,
	0.225
	]
	},
	"observation.state": {
	"min": [
	0.0,
	0.0
	],
	"max": [
	1.0,
	1.0
	]
	},
	"action": {
	"min": [
	0.0,
	0.0,
	0.0
	],
	"max": [
	1.0,
	1.0,
	1.0
	]
	}
	},
	"storage_device": "cpu",
	"vision_encoder_name": null,
	"freeze_vision_encoder": true,
	"image_encoder_hidden_dim": 32,
	"shared_encoder": true,
	"num_discrete_actions": null,
	"image_embedding_pooling_dim": 8,
	"online_steps": 1000000,
	"online_env_seed": 10000,
	"online_buffer_capacity": 100000,
	"offline_buffer_capacity": 100000,
	"async_prefetch": false,
	"online_step_before_learning": 100,
	"policy_update_freq": 1,
	"discount": 0.99,
	"temperature_init": 1.0,
	"num_critics": 2,
	"num_subsample_critics": null,
	"critic_lr": 0.0003,
	"actor_lr": 0.0003,
	"temperature_lr": 0.0003,
	"critic_target_update_weight": 0.005,
	"utd_ratio": 1,
	"state_encoder_hidden_dim": 256,
	"latent_dim": 256,
	"target_entropy": null,
	"use_backup_entropy": true,
	"grad_clip_norm": 40.0,
	"critic_network_kwargs": {
	"hidden_dims": [
	256,
	256
	],
	"activate_final": true,
	"final_activation": null
	},
	"actor_network_kwargs": {
	"hidden_dims": [
	256,
	256
	],
	"activate_final": true
	},
	"policy_kwargs": {
	"use_tanh_squash": true,
	"std_min": 1e-05,
	"std_max": 10.0,
	"init_final": 0.05
	},
	"discrete_critic_network_kwargs": {
	"hidden_dims": [
	256,
	256
	],
	"activate_final": true,
	"final_activation": null
	},
	"actor_learner_config": {
	"learner_host": "127.0.0.1",
	"learner_port": 50051,
	"policy_parameters_push_frequency": 4,
	"queue_get_timeout": 2
	},
	"concurrency": {
	"actor": "threads",
	"learner": "threads"
	},
	"use_torch_compile": true
	}