# Composition list for this config. The `group@package: option` entries and the
# `_self_` sentinel match Hydra's defaults-list syntax.
# NOTE(review): assuming Hydra, entries are merged in listed order and later
# entries override earlier ones, so do not reorder this list casually.
defaults:
  # Plain entry with no group prefix; presumably the shared base config this
  # file extends (verify that the file exists next to this one).
  - finetuning_base_config
  # The `data` group is used twice; the `@dataset` / `@buffer` suffixes give
  # each selection its own destination key so they do not collide.
  - data@dataset: tt_dataset
  - data@buffer: ReplayBuffer
  - model: ShortCircuit
  # Two selections from the `loss` group, placed under `value_loss` and
  # `policy_loss` respectively.
  - loss@value_loss: MSELoss
  - loss@policy_loss: KLDivLoss
  # Two selections from the `policy` group, placed under `AZ` and `HER`.
  - policy@AZ: AlphaZeroPolicy
  - policy@HER: HERPolicy
  - optimizer: AdamW
  - scheduler: CosineAnnealingWarmRestarts
  # `_self_` marks where this file's own keys (e.g. `debug` below) are merged.
  # NOTE(review): listed last, so under Hydra semantics values defined in this
  # file should take precedence over the entries above; confirm.
  - _self_


# Top-level debug flag, disabled here. What it toggles is decided by the code
# that reads this config, which is not visible from this file.
debug: false
