From 338a271830c9e411995c63ec6bb0b9d08b3a3e2a Mon Sep 17 00:00:00 2001 From: philtabor Date: Tue, 3 Nov 2020 16:50:03 -0700 Subject: [PATCH] add replace=False --- .../PolicyGradient/DDPG/tensorflow2/pendulum/buffer.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ReinforcementLearning/PolicyGradient/DDPG/tensorflow2/pendulum/buffer.py b/ReinforcementLearning/PolicyGradient/DDPG/tensorflow2/pendulum/buffer.py index beb58bf..096b65b 100644 --- a/ReinforcementLearning/PolicyGradient/DDPG/tensorflow2/pendulum/buffer.py +++ b/ReinforcementLearning/PolicyGradient/DDPG/tensorflow2/pendulum/buffer.py @@ -24,7 +24,7 @@ def store_transition(self, state, action, reward, state_, done): def sample_buffer(self, batch_size): max_mem = min(self.mem_cntr, self.mem_size) - batch = np.random.choice(max_mem, batch_size) + batch = np.random.choice(max_mem, batch_size, replace=False) states = self.state_memory[batch] states_ = self.new_state_memory[batch]