jimjiang203
/

rl4greencrab

Model card Files Files and versions

jimjiang203 committed on Jul 14, 2025

Commit

dbf8752

·

verified ·

1 Parent(s): 37c8108

Upload folder using huggingface_hub

Files changed (17) hide show

PPO_gcmenorm.zip +3 -0
RecurrentPPO_gcmenorm_256_1_varR0.3.zip +3 -0
TD3_gcmenorm.zip +3 -0
TQC_gcmenorm.zip +3 -0
data/.ipynb_checkpoints/ppo_env-checkpoint.csv +0 -0
data/ppo_env.csv +0 -0
data/rppo_env.csv +0 -0
data/td3_env.csv +0 -0
data/tqc_env.csv +0 -0
hyperpars/.ipynb_checkpoints/ppo-gcmnorm-checkpoint.yml +17 -0
hyperpars/.ipynb_checkpoints/rppo-gcmnorm-checkpoint.yml +39 -0
hyperpars/.ipynb_checkpoints/td3-gcmnorm-checkpoint.yml +16 -0
hyperpars/.ipynb_checkpoints/tqc-gcmnorm-checkpoint.yml +17 -0
hyperpars/ppo-gcmnorm.yml +17 -0
hyperpars/rppo-gcmnorm.yml +39 -0
hyperpars/td3-gcmnorm.yml +16 -0
hyperpars/tqc-gcmnorm.yml +17 -0

PPO_gcmenorm.zip ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fe270cc55c5453a6df4b5264b9e6df4f615c4195787b73ed22635c5b0a2bec7a
+size 163250

RecurrentPPO_gcmenorm_256_1_varR0.3.zip ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e3f9a33cc90f5c296eff51cdc9128e2dbfccd87788f913c2fd9e2fa09d1b9ab6
+size 9897589

TD3_gcmenorm.zip ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:061f6dc479bb3ff315fbd895bafa2dbcb82d275aace8a88381c1c41aeac51003
+size 6171693

TQC_gcmenorm.zip ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7eaa1c0c21ac455d5493f0f18d6fe439822e033398d7fa3e2938e128ae474396
+size 3362137

data/.ipynb_checkpoints/ppo_env-checkpoint.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

data/ppo_env.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

data/rppo_env.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

data/td3_env.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

data/tqc_env.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

hyperpars/.ipynb_checkpoints/ppo-gcmnorm-checkpoint.yml ADDED Viewed

	@@ -0,0 +1,17 @@

+algo: "PPO"
+policy: "MultiInputPolicy"
+env_id: "monthenvnorm"
+n_envs: 12
+tensorboard: "/home/rstudio/logs"
+total_timesteps: 10000000
+config:
+    "w_mort_scale" : 600
+    "growth_k": 0.70
+    'random_start': True
+    "curriculum": False
+    'var_penalty_const': 0
+use_sde: False
+id: "1"
+repo: "cboettig/rl4geco"
+save_path: "/home/rstudio/rl4greencrab/saved_agents"
+progress_bar: True

hyperpars/.ipynb_checkpoints/rppo-gcmnorm-checkpoint.yml ADDED Viewed

	@@ -0,0 +1,39 @@

+algo: 'RecurrentPPO'
+policy: "MultiInputLstmPolicy"
+env_id: "monthenvnorm"
+n_envs: 12
+tensorboard: "/home/rstudio/logs"
+total_timesteps: 15000000
+config:
+    "w_mort_scale" : 600
+    "growth_k": 0.70
+    'random_start': True
+    "curriculum": False
+    'var_penalty_const': 0.3
+model_config:
+    'verbose': 0
+    'normalize_advantage': True
+    'batch_size': 256
+    'n_steps': 1024
+    'gamma': 0.9999
+    'learning_rate': 0.0003
+    'ent_coef': 0.00429
+    'clip_range': 0.1
+    'n_epochs': 10
+    'gae_lambda': 0.9
+    'max_grad_norm': 0.5
+    'vf_coef': 0.19
+    'use_sde': False
+    'sde_sample_freq': 8
+    'tensorboard_log': "/home/rstudio/logs"
+    'policy_kwargs': dict(log_std_init=0.0,
+                          ortho_init=False,
+                       lstm_hidden_size=256,
+                       n_lstm_layers = 1,
+                       enable_critic_lstm=True,
+                       activation_fn=nn.ReLU,
+                       net_arch=dict(pi=[256, 256], vf=[256, 256]))
+id: "1"
+repo: "cboettig/rl4geco"
+save_path: "/home/rstudio/rl4greencrab/saved_agents"
+progress_bar: True

hyperpars/.ipynb_checkpoints/td3-gcmnorm-checkpoint.yml ADDED Viewed

	@@ -0,0 +1,16 @@

+algo: "TD3"
+policy: "MultiInputPolicy"
+env_id: "monthenvnorm"
+n_envs: 12
+tensorboard: "/home/rstudio/logs"
+total_timesteps: 10000000
+config:
+    "w_mort_scale" : 600
+    "growth_k": 0.70
+    'random_start': True
+    "curriculum": False
+    'var_penalty_const': 0
+id: "1"
+repo: "cboettig/rl4geco"
+save_path: "/home/rstudio/rl4greencrab/saved_agents"
+progress_bar: True

hyperpars/.ipynb_checkpoints/tqc-gcmnorm-checkpoint.yml ADDED Viewed

	@@ -0,0 +1,17 @@

+algo: "TQC"
+policy: "MultiInputPolicy"
+env_id: "monthenvnorm"
+n_envs: 12
+tensorboard: "/home/rstudio/logs"
+total_timesteps: 10000000
+config:
+    "w_mort_scale" : 600
+    "growth_k": 0.70
+    'random_start': True
+    "curriculum": False
+    'var_penalty_const': 0.3
+use_sde: False
+id: "1"
+repo: "cboettig/rl4geco"
+save_path: "/home/rstudio/rl4greencrab/saved_agents"
+progress_bar: True

hyperpars/ppo-gcmnorm.yml ADDED Viewed

	@@ -0,0 +1,17 @@

+algo: "PPO"
+policy: "MultiInputPolicy"
+env_id: "monthenvnorm"
+n_envs: 12
+tensorboard: "/home/rstudio/logs"
+total_timesteps: 10000000
+config:
+    "w_mort_scale" : 600
+    "growth_k": 0.70
+    'random_start': True
+    "curriculum": False
+    'var_penalty_const': 0
+use_sde: False
+id: "1"
+repo: "cboettig/rl4geco"
+save_path: "/home/rstudio/rl4greencrab/saved_agents"
+progress_bar: True

hyperpars/rppo-gcmnorm.yml ADDED Viewed

	@@ -0,0 +1,39 @@

+algo: 'RecurrentPPO'
+policy: "MultiInputLstmPolicy"
+env_id: "monthenvnorm"
+n_envs: 12
+tensorboard: "/home/rstudio/logs"
+total_timesteps: 15000000
+config:
+    "w_mort_scale" : 600
+    "growth_k": 0.70
+    'random_start': True
+    "curriculum": False
+    'var_penalty_const': 0.3
+model_config:
+    'verbose': 0
+    'normalize_advantage': True
+    'batch_size': 256
+    'n_steps': 1024
+    'gamma': 0.9999
+    'learning_rate': 0.0003
+    'ent_coef': 0.00429
+    'clip_range': 0.1
+    'n_epochs': 10
+    'gae_lambda': 0.9
+    'max_grad_norm': 0.5
+    'vf_coef': 0.19
+    'use_sde': False
+    'sde_sample_freq': 8
+    'tensorboard_log': "/home/rstudio/logs"
+    'policy_kwargs': dict(log_std_init=0.0,
+                          ortho_init=False,
+                       lstm_hidden_size=256,
+                       n_lstm_layers = 1,
+                       enable_critic_lstm=True,
+                       activation_fn=nn.ReLU,
+                       net_arch=dict(pi=[256, 256], vf=[256, 256]))
+id: "1"
+repo: "cboettig/rl4geco"
+save_path: "/home/rstudio/rl4greencrab/saved_agents"
+progress_bar: True

hyperpars/td3-gcmnorm.yml ADDED Viewed

	@@ -0,0 +1,16 @@

+algo: "TD3"
+policy: "MultiInputPolicy"
+env_id: "monthenvnorm"
+n_envs: 12
+tensorboard: "/home/rstudio/logs"
+total_timesteps: 10000000
+config:
+    "w_mort_scale" : 600
+    "growth_k": 0.70
+    'random_start': True
+    "curriculum": False
+    'var_penalty_const': 0
+id: "1"
+repo: "cboettig/rl4geco"
+save_path: "/home/rstudio/rl4greencrab/saved_agents"
+progress_bar: True

hyperpars/tqc-gcmnorm.yml ADDED Viewed

	@@ -0,0 +1,17 @@

+algo: "TQC"
+policy: "MultiInputPolicy"
+env_id: "monthenvnorm"
+n_envs: 12
+tensorboard: "/home/rstudio/logs"
+total_timesteps: 10000000
+config:
+    "w_mort_scale" : 600
+    "growth_k": 0.70
+    'random_start': True
+    "curriculum": False
+    'var_penalty_const': 0.3
+use_sde: False
+id: "1"
+repo: "cboettig/rl4geco"
+save_path: "/home/rstudio/rl4greencrab/saved_agents"
+progress_bar: True