added own dqn
This commit is contained in:
parent
2432dca173
commit
26d7705e19
@ -146,9 +146,6 @@ class BaseQlearner:
|
|||||||
rewards = torch.tensor([e.reward for e in experience]).float()
|
rewards = torch.tensor([e.reward for e in experience]).float()
|
||||||
dones = torch.tensor([e.done for e in experience]).float()
|
dones = torch.tensor([e.done for e in experience]).float()
|
||||||
|
|
||||||
print(rewards)
|
|
||||||
|
|
||||||
|
|
||||||
next_q_values = self.target_q_net(next_obs).detach().max(-1)[0]
|
next_q_values = self.target_q_net(next_obs).detach().max(-1)[0]
|
||||||
target_q_values = rewards + (1. - dones) * self.gamma * next_q_values
|
target_q_values = rewards + (1. - dones) * self.gamma * next_q_values
|
||||||
|
|
||||||
|
Loading…
x
Reference in New Issue
Block a user