# diffbc.yaml

# Configuration for the DiffBC planner: training schedule, algorithm
# parameters, and policy keyword arguments.
# NOTE: the `!!python/name:` tags below are PyYAML-specific and are rejected
# by `yaml.safe_load`. This file must be read with a loader that resolves
# Python tags, so only load it from a trusted source.
planner:
  training:
    # Written without digit separators: `100_000` is an integer only under
    # YAML 1.1 rules and is read as a string by YAML 1.2 core-schema parsers.
    total_timesteps: 100000
    log_interval: 10000
  params:
    # Resolves to the Python object at this dotted path; the trailing ''
    # is the empty scalar that the tag is attached to.
    policy: !!python/name:diffgro.diffbc.policies.DiffBCPlannerPolicy ''
    # Explicit tag: `1e-4` has no decimal point, so YAML 1.1 resolvers
    # (PyYAML) would otherwise load it as a string.
    learning_rate: !!float 1e-4
    batch_size: 8  # per task
  policy_kwargs:
    net_arch:
      # NOTE(review): presumably layer widths for the action network;
      # confirm against the policy class.
      act:
        - 128
        - 128
        - 128
    activation_fn: 'mish'
    sem_dim: 512
    emb_dim: 128
    # NOTE(review): presumably the number of denoising steps; confirm.
    n_denoise: 64
    # Canonical lowercase boolean (portable across YAML 1.1 and 1.2).
    predict_epsilon: false
    beta_scheduler: 'cosine'
    # Resolves to a Python class by dotted path, same mechanism as `policy`.
    normalization_class: !!python/name:sb3_jax.common.norm_layers.RunningNormLayer ''
