# Composition list for this config.
# NOTE(review): this looks like a Hydra defaults list — confirm against the
# loader. If so, `mappo_cermic_config` is composed first and, because `_self_`
# comes last, the values set in this file override it.
defaults:
  - mappo_cermic_config
  - _self_


# Algorithm settings
# NOTE(review): the per-key notes in this stanza are inferred from the key
# names only; confirm them against the schema behind `mappo_cermic_config`.
share_param_critic: true  # presumably: one critic shared across agents
clip_epsilon: 0.2  # presumably: clipping range of the surrogate objective
entropy_coef: 0.0  # 0.0 presumably disables the entropy term
critic_coef: 1.0  # presumably: weight of the critic loss
loss_critic_type: "l2"
lmbda: 0.9  # presumably: lambda used for advantage estimation
scale_mapping: "biased_softplus_1.0"
use_tanh_normal: true
minibatch_advantage: false

# CERMIC Module Configuration
cermic_tau: 0.05  # Momentum network update rate
cermic_loss_var_weight: 1.0  # Variational loss weight
cermic_loss_l2_weight: 1.0  # L2 reconstruction loss weight
cermic_loss_nce_weight: 1.0  # NCE contrastive loss weight
cermic_aug: true  # Whether to use data augmentation
cermic_intrinsic_reward_coef: 0.05  # Intrinsic reward coefficient