diff --git a/algorithms/_base.py b/algorithms/_base.py index 19652f3..15637c8 100644 --- a/algorithms/_base.py +++ b/algorithms/_base.py @@ -146,9 +146,6 @@ class BaseQlearner: rewards = torch.tensor([e.reward for e in experience]).float() dones = torch.tensor([e.done for e in experience]).float() - print(rewards) - - next_q_values = self.target_q_net(next_obs).detach().max(-1)[0] target_q_values = rewards + (1. - dones) * self.gamma * next_q_values