From f97e82a5512279337704e211151c91013cfdd1bc Mon Sep 17 00:00:00 2001 From: Tarun Date: Sat, 25 Jul 2020 14:06:34 +0100 Subject: [PATCH] updated config --- common/experience.py | 2 +- configs/whirl_baselines/iql_MMM2.yaml | 6 +++--- configs/whirl_baselines/vdn_3s5z_vs_3s6z.yaml | 4 ++-- configs/whirl_baselines/vdn_3s_vs_5z.yaml | 4 ++-- configs/whirl_baselines/vdn_MMM2.yaml | 2 +- 5 files changed, 9 insertions(+), 9 deletions(-) diff --git a/common/experience.py b/common/experience.py index 77f01960..12ac0fc5 100644 --- a/common/experience.py +++ b/common/experience.py @@ -40,7 +40,7 @@ def add(self, obs_t, action, state_t, reward, obs_tp1, done): self._states[self._next_idx] = state_t self._next_idx = (self._next_idx + 1) % self._maxsize - print(self._curr_size) + # print(self._curr_size) def _get(self, idx): return self._obses[idx], self._actions[idx], self._states[idx], self._rewards[idx], self._next_obses[idx], self._dones[idx] diff --git a/configs/whirl_baselines/iql_MMM2.yaml b/configs/whirl_baselines/iql_MMM2.yaml index 788c0961..98baf82d 100644 --- a/configs/whirl_baselines/iql_MMM2.yaml +++ b/configs/whirl_baselines/iql_MMM2.yaml @@ -51,7 +51,7 @@ params: gamma: 0.99 learning_rate: 0.0005 steps_per_epoch: 10 - batch_size: 2 + batch_size: 64 epsilon: 1.0 min_epsilon: 0.05 epsilon_decay_frames: 100000 @@ -60,14 +60,14 @@ params: name: MMM2 is_double: True score_to_win: 20 - num_steps_fill_buffer: 10 + num_steps_fill_buffer: 10000 replay_buffer_type: 'normal' replay_buffer_size: 1000000 priority_beta: 0.4 priority_alpha: 0.6 beta_decay_frames: 100000 max_beta: 1 - steps_num: 1 + steps_num: 10 # episodes_to_log: 10 atoms_num: 1 games_to_track: 20 diff --git a/configs/whirl_baselines/vdn_3s5z_vs_3s6z.yaml b/configs/whirl_baselines/vdn_3s5z_vs_3s6z.yaml index 0ddd4c9b..86b0e2e1 100644 --- a/configs/whirl_baselines/vdn_3s5z_vs_3s6z.yaml +++ b/configs/whirl_baselines/vdn_3s5z_vs_3s6z.yaml @@ -57,10 +57,10 @@ params: epsilon_decay_frames: 100000 num_epochs_to_copy: 10000 env_name: smac_cnn - name: 3s5z_vs_3s6z + name: MMM2 is_double: True score_to_win: 20 - num_steps_fill_buffer: 100000 + num_steps_fill_buffer: 10000 replay_buffer_type: 'normal' replay_buffer_size: 1000000 priority_beta: 0.4 diff --git a/configs/whirl_baselines/vdn_3s_vs_5z.yaml b/configs/whirl_baselines/vdn_3s_vs_5z.yaml index 16818698..8f2acb93 100644 --- a/configs/whirl_baselines/vdn_3s_vs_5z.yaml +++ b/configs/whirl_baselines/vdn_3s_vs_5z.yaml @@ -57,10 +57,10 @@ params: epsilon_decay_frames: 100000 num_epochs_to_copy: 10000 env_name: smac_cnn - name: 3s_vs_5z + name: MMM2 is_double: True score_to_win: 20 - num_steps_fill_buffer: 100000 + num_steps_fill_buffer: 10000 replay_buffer_type: 'normal' replay_buffer_size: 1000000 priority_beta: 0.4 diff --git a/configs/whirl_baselines/vdn_MMM2.yaml b/configs/whirl_baselines/vdn_MMM2.yaml index 2730c1a6..de98b7f6 100644 --- a/configs/whirl_baselines/vdn_MMM2.yaml +++ b/configs/whirl_baselines/vdn_MMM2.yaml @@ -60,7 +60,7 @@ params: name: MMM2 is_double: True score_to_win: 20 - num_steps_fill_buffer: 1000 + num_steps_fill_buffer: 10000 replay_buffer_type: 'normal' replay_buffer_size: 1000000 priority_beta: 0.4