Add various RL adapted configs part 2

This commit is contained in:
Julian Schönberger
2024-05-02 11:01:20 +02:00
parent c7c2c4e5a3
commit 175a02f997

View File

@ -0,0 +1,62 @@
General:
env_seed: 69
# Individual vs global rewards
individual_rewards: true
# The level.txt file to load from marl_factory_grid/levels
level_name: two_rooms_modified
# View Radius; 0 = full observatbility
pomdp_r: 0
# Print all messages and events
verbose: false
# Run tests
tests: false
# In "two rooms one door" scenario 2 agents spawn in 2 different rooms that are connected by a single door. Their aim
# is to reach the destination in the room they didn't spawn in leading to a conflict at the door.
Agents:
Wolfgang:
Actions:
- Move8
- DoorUse
- Noop
Observations:
- DirtPiles
- Self
Positions:
- (3,1) # Agent spawnpoint
Sigmund:
Actions:
- Move8
- DoorUse
- Noop
Observations:
- DirtPiles
- Self
Positions:
- (3,13)
Entities:
DirtPiles:
coords_or_quantity: (3,12), (3,2)
initial_amount: 0.5 # <1 to ensure that the robot which first attempts to clean this field, can remove the dirt in one action
clean_amount: 1
dirt_spawn_r_var: 0
max_global_amount: 12
max_local_amount: 1
Doors: { }
Rules:
# Environment Dynamics
DoorAutoClose:
close_frequency: 10
# Utilities
# This rule defines the collision mechanic, introduces a related DoneCondition and lets you specify rewards.
WatchCollisions:
done_at_collisions: false
# Done Conditions
#DoneOnAllDirtCleaned:
#DoneAtMaxStepsReached:
#max_steps: 100