{
    "MDP": {
        "name": "<class 'simple_rl.tasks.grid_world.GridWorldMDPClass.GridWorldMDP'>",
        "params": {
            "width": 6,
            "height": 6,
            "init_loc": {
                "__tuple__": true,
                "items": [
                    1,
                    1
                ]
            },
            "rand_init": false,
            "goal_locs": [
                {
                    "__tuple__": true,
                    "items": [
                        5,
                        1
                    ]
                }
            ],
            "lava_locs": [
                {
                    "__tuple__": true,
                    "items": [
                        3,
                        2
                    ]
                },
                {
                    "__tuple__": true,
                    "items": [
                        1,
                        4
                    ]
                },
                {
                    "__tuple__": true,
                    "items": [
                        2,
                        4
                    ]
                },
                {
                    "__tuple__": true,
                    "items": [
                        2,
                        5
                    ]
                }
            ],
            "walls": [
                {
                    "__tuple__": true,
                    "items": [
                        3,
                        1
                    ]
                }
            ],
            "is_goal_terminal": true,
            "gamma": 0.99,
            "slip_prob": 0.0,
            "step_cost": 0,
            "lava_cost": 1.0
        }
    },
    "AGENTS": {
        "<class 'simple_rl.agents.QLearningAgentClass.QLearningAgent'>": {
            "params": {
                "alpha": 0.1,
                "gamma": 0.99,
                "epsilon": 0.1,
                "anneal": false,
                "explore": "uniform"
            },
            "index": 0
        },
        "<class 'rlang.agents.RLangQLearningAgentClass.RLangQLearningAgent'>": {
            "params": {
                "alpha": 0.1,
                "gamma": 0.99,
                "epsilon": 0.1,
                "anneal": false,
                "explore": "uniform"
            },
            "index": 1
        }
    },
    "MISC": {
        "instances": 5,
        "episodes": 100,
        "steps": 200,
        "track_disc_reward": false
    },
    "FUNC": "run_agents_on_mdp"
}