added own dqn
This commit is contained in:
parent
2432dca173
commit
26d7705e19
@ -146,9 +146,6 @@ class BaseQlearner:
|
||||
rewards = torch.tensor([e.reward for e in experience]).float()
|
||||
dones = torch.tensor([e.done for e in experience]).float()
|
||||
|
||||
print(rewards)
|
||||
|
||||
|
||||
next_q_values = self.target_q_net(next_obs).detach().max(-1)[0]
|
||||
target_q_values = rewards + (1. - dones) * self.gamma * next_q_values
|
||||
|
||||
|
Loading…
x
Reference in New Issue
Block a user