Add various RL adapted configs part 2

2026-01-15 23:41:39 +01:00 · 2024-05-02 11:01:20 +02:00
parent c7c2c4e5a3
commit 175a02f997
1 changed files with 62 additions and 0 deletions
--- a/marl_factory_grid/configs/custom/two_rooms_one_door_modified.yaml
+++ b/marl_factory_grid/configs/custom/two_rooms_one_door_modified.yaml
@@ -0,0 +1,62 @@
+General:
+  env_seed: 69
+  # Individual vs global rewards
+  individual_rewards: true
+  # The level.txt file to load from marl_factory_grid/levels
+  level_name: two_rooms_modified
+  # View Radius; 0 = full observatbility
+  pomdp_r: 0
+  # Print all messages and events
+  verbose: false
+  # Run tests
+  tests: false
+
+# In "two rooms one door" scenario 2 agents spawn in 2 different rooms that are connected by a single door. Their aim
+# is to reach the destination in the room they didn't spawn in leading to a conflict at the door.
+Agents:
+  Wolfgang:
+    Actions:
+      - Move8
+      - DoorUse
+      - Noop
+    Observations:
+      - DirtPiles
+      - Self
+    Positions:
+      - (3,1) # Agent spawnpoint
+  Sigmund:
+    Actions:
+      - Move8
+      - DoorUse
+      - Noop
+    Observations:
+      - DirtPiles
+      - Self
+    Positions:
+      - (3,13)
+
+Entities:
+  DirtPiles:
+    coords_or_quantity: (3,12), (3,2)
+    initial_amount: 0.5 # <1 to ensure that the robot which first attempts to clean this field, can remove the dirt in one action
+    clean_amount: 1
+    dirt_spawn_r_var: 0
+    max_global_amount: 12
+    max_local_amount: 1
+
+  Doors: { }
+
+Rules:
+  # Environment Dynamics
+  DoorAutoClose:
+    close_frequency: 10
+
+  # Utilities
+  # This rule defines the collision mechanic, introduces a related DoneCondition and lets you specify rewards.
+  WatchCollisions:
+    done_at_collisions: false
+
+  # Done Conditions
+  #DoneOnAllDirtCleaned:
+  #DoneAtMaxStepsReached:
+    #max_steps: 100