Patch summary (text before the first "diff --git" header is skipped by patch tools):
  * slm_lab/agent/memory/prioritized.py: get_priority() now calls .cpu() on
    `error` before adding self.epsilon and raising to self.alpha.
  * slm_lab/experiment/monitor.py: Body.__init__ now initialises self.agent
    to None (per its inline comment, the attribute is set later).
NOTE(review): line breaks and indentation were reconstructed from the hunk
line counts; confirm against the target files before applying.

diff --git a/slm_lab/agent/memory/prioritized.py b/slm_lab/agent/memory/prioritized.py
index 01f307c2f..610c6e278 100644
--- a/slm_lab/agent/memory/prioritized.py
+++ b/slm_lab/agent/memory/prioritized.py
@@ -138,7 +138,7 @@ def add_experience(self, state, action, reward, next_state, done, error=100000):
 
     def get_priority(self, error):
         '''Takes in the error of one or more examples and returns the proportional priority'''
-        p = torch.pow(error + self.epsilon, self.alpha)
+        p = torch.pow(error.cpu() + self.epsilon, self.alpha)
         return p.squeeze_().cpu().numpy()
 
     def sample_idxs(self, batch_size):
diff --git a/slm_lab/experiment/monitor.py b/slm_lab/experiment/monitor.py
index 1f138160e..b5c719d79 100644
--- a/slm_lab/experiment/monitor.py
+++ b/slm_lab/experiment/monitor.py
@@ -81,6 +81,7 @@ class Body:
 
     def __init__(self, env, agent_spec, aeb=(0, 0, 0), aeb_space=None):
         # essential reference variables
+        self.agent = None  # set later
         self.env = env
         self.aeb = aeb
         self.a, self.e, self.b = aeb