# Environment entry "env1": names an environment, supplies a nested
# env_config mapping for it, and sets train/test sizes.
env1:
    # Environment identifier. Presumably resolved by the config loader to an
    # environment implementation -- TODO confirm against the consumer.
    env_name: sokoban
    # Settings nested under this environment entry.
    env_config:
        # NOTE(review): "vision" presumably selects image-based rendering
        # rather than text -- confirm the accepted values.
        render_mode: vision
        # NOTE(review): presumably names the prompt/response template to
        # use -- confirm the accepted values.
        prompt_format: free_think
        # Boolean flag, disabled here. Presumably toggles a state-based
        # reward term -- confirm.
        use_state_reward: false
    # Integer sizes. Presumably the number of training and test instances
    # generated for this environment -- TODO confirm units.
    train_size: 10000
    test_size: 128