27 lines
688 B
YAML
27 lines
688 B
YAML
agent:
|
|
classname: studies.sat_mad.A2CAgent
|
|
observation_size: 4*5*5
|
|
hidden_size: 128
|
|
n_actions: 10
|
|
|
|
env:
|
|
classname: environments.factory.make
|
|
env_name: "DirtyFactory-v0"
|
|
n_agents: 1
|
|
pomdp_r: 2
|
|
max_steps: 400
|
|
stack_n_frames: 3
|
|
individual_rewards: True
|
|
|
|
algorithm:
|
|
max_epochs: 1000000
|
|
n_envs: 1
|
|
n_timesteps: 10
|
|
discount_factor: 0.99
|
|
entropy_coef: 0.01
|
|
critic_coef: 1.0
|
|
gae: 0.25
|
|
optimizer:
|
|
classname: torch.optim.Adam
|
|
lr: 0.0003
|
|
weight_decay: 0.0 |