Skip to content

Commit

Permalink
Merge branch 'main' into Niki
Browse files Browse the repository at this point in the history
  • Loading branch information
nicolalove committed Jun 7, 2024
2 parents 7356744 + b394d00 commit bf9d6dd
Show file tree
Hide file tree
Showing 9 changed files with 2,998 additions and 197 deletions.
38 changes: 37 additions & 1 deletion hyperpars/ppo-caribou.yml
Original file line number Diff line number Diff line change
@@ -1,9 +1,43 @@
# stable-baselines3 configuration

# algo: "PPO"
# env_id: "CaribouScipy"
# config: {}
# n_envs: 12
# tensorboard: "../../../logs"
# total_timesteps: 1000000
# use_sde: True
# repo: "boettiger-lab/rl4eco"
# save_path: "../saved_agents"
# id: "3"

algo: "PPO"
total_timesteps: 5000000
algo_config:
tensorboard_log: "../../../logs"
#
policy: 'MlpPolicy'
# batch_size: 512
# gamma: 0.9999
# learning_rate: !!float 7.77e-05
# ent_coef: 0.00429
# clip_range: 0.1
# gae_lambda: 0.9
# max_grad_norm: 5
# vf_coef: 0.19
# use_sde: True
# policy_kwargs: "dict(log_std_init=-3.29, ortho_init=False, net_arch=[256, 128])"
# in policy_kwargs: net_arch=[400, 300]
# policy: 'MlpPolicy'
# use_sde: True
# policy_kwargs: "dict(log_std_init=-3, net_arch=[400, 300])"
# clip_range: 0.1

# env
env_id: "CaribouScipy"
config: {"r_b":.25 } #this is what is passed into the creation of the environment, could pass diff param values here to change the defaults (instead of messing with the params defined in caribou_ode.py)
n_envs: 12

tensorboard: "/home/rstudio/logs"
#total_timesteps: 50000
total_timesteps: 5000000
Expand All @@ -13,4 +47,6 @@ save_path: "./saved_agents"
id: "3"
#rppo - ppo that has memory (should be better than PPO but hard to train lol)
#td3 - giving some weird errors
#tqc is actually better if we can give it enough time to run
#tqc is actually better if we can give it enough time to run
# misc
additional_imports: ["torch"]
47 changes: 41 additions & 6 deletions hyperpars/tqc-caribou.yml
Original file line number Diff line number Diff line change
@@ -1,12 +1,47 @@
# stable-baselines3 configuration

# algo: "TQC"
# env_id: "CaribouScipy"
# n_envs: 12
# tensorboard: "/home/rstudio/logs"
# total_timesteps: 500000
# config: {}
# use_sde: True
# repo: "boettiger-lab/rl4eco"
# save_path: "../saved_agents"
# id: "2"

algo: "TQC"
total_timesteps: 5000000
algo_config:
tensorboard_log: "../../../logs"
#
policy: 'MlpPolicy'
# batch_size: 512
# gamma: 0.9999
# learning_rate: !!float 7.77e-05
# ent_coef: 0.00429
# clip_range: 0.1
# gae_lambda: 0.9
# max_grad_norm: 5
# vf_coef: 0.19
# use_sde: True
# policy_kwargs: "dict(log_std_init=-3.29, ortho_init=False, net_arch=[256, 128])"
# in policy_kwargs: net_arch=[400, 300]
# policy: 'MlpPolicy'
# use_sde: True
# policy_kwargs: "dict(log_std_init=-3, net_arch=[400, 300])"
# clip_range: 0.1

# env
env_id: "CaribouScipy"
n_envs: 12
tensorboard: "/home/rstudio/logs"
total_timesteps: 500000
config: {}
use_sde: True
repo: "boettiger-lab/rl4eco"
n_envs: 12

# io
repo: "cboettig/rl-ecology"
save_path: "../saved_agents"
id: "2"

# misc
# id: ""
additional_imports: ["torch"]
Loading

0 comments on commit bf9d6dd

Please sign in to comment.