# Nested settings mapping `P`, split into two named sections.
# NOTE(review): presumably read as run parameters by code outside this
# snippet -- confirm against the consumer before changing keys or defaults.
P = {
    # "deployment" section: `train` is enabled, no agent is set (None),
    # and the observers mapping starts out empty.
    "deployment": {"train": True, "agent": None, "observers": {}},
    # "pbrl" section: the reward source is the string "oracle".
    "pbrl": {"reward_source": "oracle"},
}
