class Names:
    """Namespace of string constants referenced by symbolic name.

    Each class attribute binds an upper-case identifier to a fixed string
    literal, so callers can write ``Names.N_AGENTS`` instead of repeating the
    raw string ``'n_agents'``. The class holds no state and defines no
    methods; it is not meant to be instantiated.

    NOTE(review): the consumers of these values are not visible in this
    file. The names suggest configuration keys, entity identifiers and
    algorithm/mode selectors -- confirm against the callers before renaming
    or changing any literal, since the exact strings (including case and
    the '-' vs '_' separators) are presumably matched elsewhere.
    """

    # One assignment per line: several simple statements on the same line
    # without a newline or ';' separator are a SyntaxError in Python.
    ENV = 'env'
    ENV_NAME = 'env_name'
    N_AGENTS = 'n_agents'
    ALGORITHM = 'algorithm'
    MAX_STEPS = 'max_steps'
    N_STEPS = 'n_steps'
    TRAIN_RENDER = 'train_render'
    EVAL_RENDER = 'eval_render'
    AGENT = 'Agent'
    PILE_OBSERVABILITY = 'pile-observability'
    PILE_ORDER = 'pile-order'
    ALL = 'all'
    FIXED = 'fixed'
    AGENTS = 'agents'
    DYNAMIC = 'dynamic'
    SMART = 'smart'
    DIRT_PILES = 'DirtPiles'
    AUXILIARY_PILES = "auxiliary_piles"
    DOORS = 'Doors'
    DOOR = 'Door'
    GAMMA = 'gamma'
    ADVANTAGE = 'advantage'
    REINFORCE = 'reinforce'
    ADVANTAGE_AC = "Advantage-AC"
    TD_ADVANTAGE_AC = "TD-Advantage-AC"
    CHUNK_EPISODE = 'chunk-episode'
    POS_POINTER = 'pos_pointer'
    POSITIONS = 'positions'
    SAVE_AND_LOG = 'save_and_log'
    NOOP = 'Noop'
    USE_DOOR = 'use_door'
    PILE_ALL_DONE = 'pile_all_done'
    SINGLE = 'single'
    DISTRIBUTED = 'distributed'
    SHARED = 'shared'
    EARLY_STOPPING = 'early_stopping'
    TRAIN = 'train'
    SEED = 'seed'
    LAST_N_EPISODES = 'last_n_episodes'
    MEAN_TARGET_CHANGE = 'mean_target_change'
    WANDB_LOG = 'wandb_log'