def default_cfg():
    """Return a freshly built dict of default configuration values.

    The settings are grouped into three sections (PPO, RAPO, logging/save)
    and merged into a single flat mapping, keeping keys in that section
    order. Each call constructs a new dict, so callers may mutate the
    result without affecting later calls.

    NOTE(review): the meaning and units of individual keys are defined by
    whatever code consumes this config, which is not visible here.
    """
    # PPO
    ppo_section = dict(
        LR=3e-4,
        NUM_ENVS=16,
        NUM_STEPS=1024,
        TOTAL_TIMESTEPS=1e8,  # float literal, kept as-is
        UPDATE_EPOCHS=4,
        NUM_MINIBATCHES=32,
        GAMMA=0.99,
        GAE_LAMBDA=0.95,
        CLIP_EPS=0.2,
        ENT_COEF=0.00,
        VF_COEF=0.5,
        MAX_GRAD_NORM=0.5,
        ACTIVATION="tanh",
        ENV_NAME="ant",
        ANNEAL_LR=False,
        NORMALIZE_ENV=False,
    )

    # RAPO (ensemble only)
    rapo_section = dict(
        M_NEXT=8,
        ADV_STEPS=2,
        ADV_LR=3e-4,
        ADV_USE_ACTION=True,
        KL_DELTA=0.05,
        KL_EPS=1e-3,
        ADV_KL_PENALTY=10.0,
        NUM_MODEL_ENVS=8,
        RHO_THETA=0.2,
        THETA_UPDATE_SUBSAMPLE=256,
        THETA_PRIOR_MASS_STD=0.05,
        THETA_PRIOR_INERTIA_STD=0.05,
        THETA_PRIOR_FRICTION_STD=0.05,
        THETA_PRIOR_TORQUE_STD=0.05,
        THETA_PRIOR_COM_STD=0.005,
        THETA_SCALE_MIN=0.8,
        THETA_SCALE_MAX=1.2,
        THETA_COM_ABSMAX=0.00,
        BRAX_BACKEND="positional",
        DEBUG=True,
    )

    # logging/save
    logging_section = dict(
        LOG_DIR="runs",
        SAVE_EVERY_UPDATES=10,
        PRINT_EVERY_UPDATES=1,
    )

    # Merge in section order so key iteration order matches the flat layout.
    return {**ppo_section, **rapo_section, **logging_section}