Skip to content

Commit 228706f

Browse files
committed
feat (zym): update ppo config to support discrete action space
1 parent 888acd6 commit 228706f

File tree

3 files changed: +0 additions, -7 deletions (7 lines changed)

dizoo/atari/config/serial/enduro/enduro_onppo_config.py

-5 (5 lines removed in this file)
Original file line number | Diff line number | Diff line change
@@ -29,7 +29,6 @@
29 | 29 |   learn=dict(
30 | 30 |   lr_scheduler=dict(epoch_num=5200, min_lr_lambda=0),
31 | 31 |   epoch_per_collect=4,
32 |    | - update_per_collect=1,
33 | 32 |   batch_size=256,
34 | 33 |   learning_rate=2.5e-4,
35 | 34 |   value_weight=0.5,
@@ -54,10 +53,6 @@
54 | 53 |   discount_factor=0.99,
55 | 54 |   ),
56 | 55 |   eval=dict(evaluator=dict(eval_freq=5000, )),
57 |    | - # other=dict(replay_buffer=dict(
58 |    | - # replay_buffer_size=10000,
59 |    | - # max_use=3,
60 |    | - # ), ),
61 | 56 |   ),
62 | 57 |   )
63 | 58 |   main_config = EasyDict(enduro_onppo_config)

dizoo/atari/config/serial/qbert/qbert_onppo_config.py

-1 (1 line removed in this file)
Original file line number | Diff line number | Diff line change
@@ -28,7 +28,6 @@
28 | 28 |   learn=dict(
29 | 29 |   lr_scheduler=dict(epoch_num=5200, min_lr_lambda=0),
30 | 30 |   epoch_per_collect=4,
31 |    | - update_per_collect=1,
32 | 31 |   batch_size=256,
33 | 32 |   learning_rate=2.5e-4,
34 | 33 |   value_weight=0.5,

dizoo/atari/config/serial/spaceinvaders/spaceinvaders_onppo_config.py

-1 (1 line removed in this file)
Original file line number | Diff line number | Diff line change
@@ -30,7 +30,6 @@
30 | 30 |   learn=dict(
31 | 31 |   lr_scheduler=dict(epoch_num=5200, min_lr_lambda=0),
32 | 32 |   epoch_per_collect=4,
33 |    | - update_per_collect=1,
34 | 33 |   batch_size=256,
35 | 34 |   learning_rate=2.5e-4,
36 | 35 |   value_weight=0.5,

0 commit comments

Comments
 (0)