from rlutils.rewards.models import RewardTree

# Parameter dictionary exposed by this module as ``P``.
#
# It holds a single "pbrl" section that names "model" as the reward source
# and gives the settings for that model. The entry under "class" is the
# RewardTree class object itself (not an instance).
# NOTE(review): the remaining entries are presumably forwarded to RewardTree
# by whatever consumes P -- confirm against the consumer; their exact meaning
# is defined there and is not visible from this file.
P = {
    "pbrl": dict(
        reward_source="model",
        model={
            "class": RewardTree,
            "num_from_queue": float("inf"),
            "min_samples_leaf": 1,
            "m_max": 100,
            "preference_eqn": "bradley-terry",
            "store_all_qual": False,
            "split_dim_entropy": 0.0,
            "nodewise_partition": False,
            "split_by_preference": False,
            "loss_func": "bce",
            "alpha": 0.005,
            "prune_ratio": None,
            "trees_per_update": 1,
            "forest_size": 1,
            "sort_forest_by": "age",
        },
    ),
}
