Skip to content

Commit 1ac9ad5

Browse files
committed
config(nyz): fix masac smac config multi_agent=True bug (#791)
1 parent 96c4955 commit 1ac9ad5

11 files changed, with 15 additions (+15) and 16 deletions (-16).

dizoo/smac/config/smac_10m11m_masac_config.py

+2-3
Original file line number | Diff line number | Diff line change
@@ -26,7 +26,7 @@
2626
),
2727
policy=dict(
2828
cuda=True,
29-
on_policy=False,
29+
multi_agent=True,
3030
random_collect_size=0,
3131
model=dict(
3232
agent_obs_shape=132,
@@ -52,7 +52,6 @@
5252
collect=dict(
5353
env_num=collector_env_num,
5454
n_sample=1600,
55-
unroll_len=1,
5655
),
5756
command=dict(),
5857
eval=dict(
@@ -88,4 +87,4 @@
8887
if __name__ == '__main__':
8988

9089
from ding.entry import serial_pipeline
91-
serial_pipeline((main_config, create_config), seed=0)
90+
serial_pipeline((main_config, create_config), seed=0, max_env_step=int(1e7))

dizoo/smac/config/smac_25m_masac_config.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -26,7 +26,7 @@
2626
),
2727
policy=dict(
2828
cuda=True,
29-
on_policy=False,
29+
multi_agent=True,
3030
random_collect_size=0,
3131
model=dict(
3232
agent_obs_shape=306,

dizoo/smac/config/smac_2c64zg_masac_config.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -26,7 +26,7 @@
2626
),
2727
policy=dict(
2828
cuda=True,
29-
on_policy=False,
29+
multi_agent=True,
3030
random_collect_size=0,
3131
model=dict(
3232
agent_obs_shape=404,

dizoo/smac/config/smac_3m_masac_config.py

+2-2
Original file line number | Diff line number | Diff line change
@@ -26,6 +26,7 @@
2626
),
2727
policy=dict(
2828
cuda=True,
29+
multi_agent=True,
2930
random_collect_size=0,
3031
model=dict(
3132
agent_obs_shape=42,
@@ -41,7 +42,6 @@
4142
learning_rate_q=5e-4,
4243
learning_rate_policy=5e-4,
4344
learning_rate_alpha=5e-4,
44-
ignore_done=False,
4545
target_theta=0.005,
4646
discount_factor=0.99,
4747
alpha=0.2,
@@ -63,7 +63,7 @@
6363
start=1,
6464
end=0.05,
6565
decay=100000,
66-
), # TODO(pu)
66+
),
6767
replay_buffer=dict(replay_buffer_size=1000000, ),
6868
),
6969
),

dizoo/smac/config/smac_3s5z_masac_config.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -26,6 +26,7 @@
2626
),
2727
policy=dict(
2828
cuda=True,
29+
multi_agent=True,
2930
random_collect_size=0,
3031
model=dict(
3132
agent_obs_shape=150,
@@ -41,7 +42,6 @@
4142
learning_rate_q=5e-4,
4243
learning_rate_policy=5e-4,
4344
learning_rate_alpha=5e-5,
44-
ignore_done=False,
4545
target_theta=0.005,
4646
discount_factor=0.99,
4747
alpha=0.2,

dizoo/smac/config/smac_3s5zvs3s6z_masac_config.py

+2-3
Original file line number | Diff line number | Diff line change
@@ -19,15 +19,14 @@
1919
stop_value=0.99,
2020
death_mask=True,
2121
special_global_state=special_global_state,
22-
# save_replay_episodes = 1,
2322
manager=dict(
2423
shared_memory=False,
2524
reset_timeout=6000,
2625
),
2726
),
2827
policy=dict(
2928
cuda=True,
30-
on_policy=False,
29+
multi_agent=True,
3130
random_collect_size=0,
3231
model=dict(
3332
agent_obs_shape=159,
@@ -89,4 +88,4 @@
8988
if __name__ == '__main__':
9089

9190
from ding.entry import serial_pipeline
92-
serial_pipeline((main_config, create_config), seed=0)
91+
serial_pipeline((main_config, create_config), seed=0, max_env_step=int(1e7))

dizoo/smac/config/smac_5m6m_masac_config.py

+1
Original file line number | Diff line number | Diff line change
@@ -26,6 +26,7 @@
2626
),
2727
policy=dict(
2828
cuda=True,
29+
multi_agent=True,
2930
random_collect_size=0,
3031
model=dict(
3132
agent_obs_shape=72,

dizoo/smac/config/smac_8m9m_masac_config.py

+1-2
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,4 @@
11
from easydict import EasyDict
2-
from ding.entry import serial_pipeline
32

43
agent_num = 8
54
collector_env_num = 8
@@ -27,7 +26,7 @@
2726
),
2827
policy=dict(
2928
cuda=True,
30-
on_policy=False,
29+
multi_agent=True,
3130
random_collect_size=0,
3231
model=dict(
3332
agent_obs_shape=108,

dizoo/smac/config/smac_MMM2_masac_config.py

+1
Original file line number | Diff line number | Diff line change
@@ -26,6 +26,7 @@
2626
),
2727
policy=dict(
2828
cuda=True,
29+
multi_agent=True,
2930
random_collect_size=0,
3031
model=dict(
3132
agent_obs_shape=204,

dizoo/smac/config/smac_MMM_masac_config.py

+1
Original file line number | Diff line number | Diff line change
@@ -26,6 +26,7 @@
2626
),
2727
policy=dict(
2828
cuda=True,
29+
multi_agent=True,
2930
random_collect_size=0,
3031
model=dict(
3132
agent_obs_shape=186,

dizoo/smac/config/smac_corridor_masac_config.py

+2-3
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,4 @@
11
from easydict import EasyDict
2-
from ding.entry import serial_pipeline
32

43
agent_num = 6
54
collector_env_num = 8
@@ -27,7 +26,7 @@
2726
),
2827
policy=dict(
2928
cuda=True,
30-
on_policy=False,
29+
multi_agent=True,
3130
random_collect_size=0,
3231
model=dict(
3332
agent_obs_shape=192,
@@ -89,4 +88,4 @@
8988
if __name__ == '__main__':
9089

9190
from ding.entry import serial_pipeline
92-
serial_pipeline((main_config, create_config), seed=0)
91+
serial_pipeline((main_config, create_config), seed=0, max_env_step=int(1e7))

0 commit comments

Comments
 (0)