mirror of
https://github.com/illiumst/marl-factory-grid.git
synced 2025-06-18 10:42:53 +02:00
cleanup algos + adjusted renderer to support "ray casting"
This commit is contained in:
@ -25,7 +25,7 @@ class MQLearner(QLearner):
|
||||
if len(self.buffer) < self.batch_size: return
|
||||
for _ in range(self.n_grad_steps):
|
||||
|
||||
experience = self.buffer.sample(self.batch_size, cer=self.train_every_n_steps)
|
||||
experience = self.buffer.sample(self.batch_size, cer=self.train_every[-1])
|
||||
|
||||
with torch.no_grad():
|
||||
q_target_next = self.target_q_net(experience.next_observation)
|
||||
|
Reference in New Issue
Block a user