# Original implementation: https://github.com/abaisero/gym-gridverse
#
####
#
# Extended to informed POMDPs by anonymous authors (2025)
#
####

# State space: declares the object types and colors used for environment
# states.
# NOTE(review): the same two lists appear verbatim under observation_space and
# information_space in this file; if they are meant to stay identical, update
# all three together.
state_space:
  objects: [ Wall, Floor, Exit, Beacon ]
  colors: [ NONE, RED, GREEN, BLUE, YELLOW ]

# Action space: the six actions listed here -- four moves (forward, backward,
# left, right) and two turns (left, right).
# NOTE(review): presumably these are the only actions the agent may take and
# moves do not change the agent's orientation -- confirm against the loader.
action_space:
  - MOVE_FORWARD
  - MOVE_BACKWARD
  - MOVE_LEFT
  - MOVE_RIGHT
  - TURN_LEFT
  - TURN_RIGHT

# Observation space: declares the object types and colors used for
# observations. The lists here are identical to those under state_space.
observation_space:
  objects: [ Wall, Floor, Exit, Beacon ]
  colors: [ NONE, RED, GREEN, BLUE, YELLOW ]

# Information space definition: declares the object types and colors used for
# the "information" signal. The lists here are identical to those under
# state_space and observation_space.
# NOTE(review): presumably this section belongs to the informed-POMDP
# extension mentioned in the file header -- confirm against the loader.
information_space:
  objects: [ Wall, Floor, Exit, Beacon ]
  colors: [ NONE, RED, GREEN, BLUE, YELLOW ]

# Reset function: selects the function named `memory_rooms` and supplies its
# parameters. The parameter semantics are defined by that function, which is
# not part of this file.
reset_function:
  name: memory_rooms
  # NOTE(review): presumably a [height, width] grid size (per room or for the
  # whole grid) -- TODO confirm.
  shape: [ 7, 7 ]
  # NOTE(review): presumably the arrangement of rooms (2 by 2) -- TODO confirm.
  layout: [ 2, 2 ]
  # The four non-NONE colors declared in the space definitions above.
  colors: [ RED, GREEN, BLUE, YELLOW ]
  num_beacons: 1
  num_exits: 2

# Transition functions: a list of two named entries, neither of which takes
# additional parameters here.
# NOTE(review): presumably `move_agent` handles the MOVE_* actions and
# `turn_agent` the TURN_* actions, applied in the listed order -- confirm.
transition_functions:
  - name: move_agent
  - name: turn_agent

# Reward functions: a list of two named entries.
# NOTE(review): presumably the individual rewards are summed each step --
# confirm against the loader.
reward_functions:
  # Outcome rewards of equal magnitude and opposite sign (+5.0 / -5.0).
  # NOTE(review): presumably "good" means reaching the exit that matches the
  # beacon and "bad" means reaching another exit -- TODO confirm.
  - name: reach_exit_memory
    reward_good: 5.0
    reward_bad: -5.0
  # Small negative reward (-0.05).
  # NOTE(review): presumably applied on every step as a time penalty -- confirm.
  - name: living_reward
    reward: -0.05

# 3x2x3 observation tensor
# The area is given as two [min, max] pairs. With inclusive bounds, the first
# pair (-1..0) spans 2 cells and the second pair (-1..1) spans 3 cells.
# NOTE(review): the axis order (which pair is rows vs. columns), the frame the
# offsets are relative to (presumably the agent), and the meaning of the third
# tensor dimension are not shown in this file -- TODO confirm.
observation_function:
  name: partially_occluded
  area: [ [-1, 0 ], [-1, 1 ] ]

# larger information tensor
# Uses the same function name as observation_function (`partially_occluded`)
# but with a wider area. With inclusive bounds, the first pair (-3..0) spans
# 4 cells and the second pair (-2..2) spans 5 cells.
# NOTE(review): axis order and the frame the offsets are relative to are not
# shown in this file -- TODO confirm.
information_function:
  name: partially_occluded
  area: [ [-3, 0 ], [-2, 2 ] ]

# Terminating function: selects the function named `reach_exit`; no additional
# parameters are supplied.
# NOTE(review): presumably the episode ends when the agent reaches any exit,
# regardless of whether the reward was good or bad -- confirm.
terminating_function:
  name: reach_exit
