2 agents running

2021-05-18 17:13:56 +02:00
parent 05c54ad8d8
commit c1f2ddf3cd
2 changed files with 8 additions and 5 deletions
--- a/environments/factory/simple_factory_getting_dirty.py
+++ b/environments/factory/simple_factory_getting_dirty.py
@@ -106,7 +106,10 @@ class GettingDirty(BaseFactory):
        current_dirt_amount = self.state[DIRT_INDEX].sum()
        dirty_tiles = len(np.nonzero(self.state[DIRT_INDEX]))

-        this_step_reward = -(dirty_tiles / current_dirt_amount)
+        try:
+            this_step_reward = -(dirty_tiles / current_dirt_amount)
+        except ZeroDivisionError:
+            this_step_reward = 0

        for agent_state in agent_states:
            collisions = agent_state.collisions
@@ -127,10 +130,10 @@ if __name__ == '__main__':
    render = True

    dirt_props = DirtProperties()
-    factory = GettingDirty(n_agents=1, dirt_properties=dirt_props)
+    factory = GettingDirty(n_agents=2, dirt_properties=dirt_props)
    monitor_list = list()
    for epoch in range(100):
-        random_actions = [random.randint(0, 8) for _ in range(200)]
+        random_actions = [(random.randint(0, 8), random.randint(0, 8)) for _ in range(200)]
        env_state, reward, done_bool, _ = factory.reset()
        for agent_i_action in random_actions:
            env_state, reward, done_bool, info_obj = factory.step(agent_i_action)