---
# Algorithm selection plus the settings grouped under `alg_args`.
# NOTE(review): the meanings noted below are inferred from the key names
# only; confirm them against the code that consumes this file.

# Name of the algorithm these settings belong to.
alg: 'coma'

alg_args:
  # Presumably the optimizer learning rates for the policy and the value
  # function respectively -- TODO confirm.
  policy_lrate: 1.0e-4
  value_lrate: 1.0e-4
  # Presumably how many samples are drawn per estimate -- TODO confirm.
  sample_size: 10
  # Boolean switches, written as canonical lowercase YAML booleans.
  gaussian_policy: false
  action_enforcebound: true