mirror of
				https://github.com/illiumst/marl-factory-grid.git
				synced 2025-10-31 12:37:27 +01:00 
			
		
		
		
	added own dqn
This commit is contained in:
		| @@ -146,9 +146,6 @@ class BaseQlearner: | ||||
|             rewards = torch.tensor([e.reward for e in experience]).float() | ||||
|             dones = torch.tensor([e.done for e in experience]).float() | ||||
|  | ||||
|             print(rewards) | ||||
|  | ||||
|  | ||||
|             next_q_values = self.target_q_net(next_obs).detach().max(-1)[0] | ||||
|             target_q_values = rewards + (1. - dones) * self.gamma * next_q_values | ||||
|  | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 romue
					romue