diff --git a/controllers/mat_train/runner/soccer_runner.py b/controllers/mat_train/runner/soccer_runner.py index 427dfdb..a861b32 100644 --- a/controllers/mat_train/runner/soccer_runner.py +++ b/controllers/mat_train/runner/soccer_runner.py @@ -101,7 +101,6 @@ def run(self): self.log_train(train_infos, total_num_steps) num = self.episode_length * self.log_interval - print("rewards: {}".format(sum_episode_rewards[0]/num)) self.writter.add_scalars("train_episode_rewards", {"total_rewards": sum_episode_rewards[0]/num}, total_num_steps) sum_episode_rewards = [0 for _ in range(self.n_rollout_threads)] self.writter.add_scalars("train_episode_rewards", {"ball_distance_reward": sum_ball_distance_reward[0]/self.num_agents/num}, total_num_steps) diff --git a/controllers/mat_train/soccer/soccer.py b/controllers/mat_train/soccer/soccer.py index f083559..b1c8493 100644 --- a/controllers/mat_train/soccer/soccer.py +++ b/controllers/mat_train/soccer/soccer.py @@ -188,7 +188,7 @@ def step(self, action): velocity_reward = 10.0 out_of_field_reward = -100.0 collision_reward = -1.0 - ball_position_reward = 2.0 + ball_position_reward = 4.0 ball_tracking_reward = 0.1 rew_ball_distance = dict(zip(self.agents, [0.0 for _ in self.agents]))