# Planning-strategy configuration. `_target_` names the class this mapping
# describes; the remaining top-level keys are presumably handed to it as
# constructor arguments by the config loader — TODO confirm at the
# instantiation site.
_target_: lambda_ac.util.planning_strategies.TdmpcStrategy

# Disabled duplicate: an active `action_dim` entry with the same interpolation
# is defined further down in this file.
#action_dim: ${env.action_dim}
# The components are not defined here; each value is an interpolation that
# resolves to the entry of the same name under `agent`.
model: ${agent.model}
critic: ${agent.critic}
actor: ${agent.actor}

# Schedules for inference
# std_schedule: a LinearSchedule configured with start 0.5 and duration 25000.
# NOTE(review): presumably moves linearly from `start` to `final` over
# `duration` steps; the unit of `duration` is not visible here — confirm
# against LinearSchedule.
std_schedule:
  _target_: lambda_ac.util.schedulers.LinearSchedule
  start: 0.5
  # Interpolated rather than hard-coded; presumably resolves to the `min_std`
  # key of this file, assuming this config is mounted at
  # agent.planning_strategy — verify.
  final: ${agent.planning_strategy.min_std}
  duration: 25000

# horizon_schedule: a LinearSchedule configured to go from 4 to 5 with
# duration 25000 (same duration as std_schedule).
# NOTE(review): `final` is a literal 5 that matches the literal `horizon: 5`
# elsewhere in this file, but the two are not linked by interpolation (unlike
# std_schedule.final, which references min_std). Changing one will not change
# the other — confirm whether they are meant to track each other.
horizon_schedule: 
  _target_: lambda_ac.util.schedulers.LinearSchedule
  start: 4
  final: 5
  duration: 25000

# Hyper-parameters
# Literal planning horizon; horizon_schedule.final in this file carries the
# same literal value.
horizon: 5
# Resolved from the top-level `initial_steps` entry of the composed config.
seed_steps: ${initial_steps}
# Resolved from `action_dim` under the `env` config node.
action_dim: ${env.action_dim}

# Literal planner settings.
iterations: 6
# Note: this is the same as batch_size in the paper; it is unclear whether it
# should reference ${batch_size} or remain independent.
num_samples: 512
num_elites: 64
mixture_coef: 0.05
# Also referenced by std_schedule.final in this file via
# ${agent.planning_strategy.min_std}.
min_std: 0.05
temperature: 0.5
momentum: 0.1

# Values forwarded from the agent / global config through interpolation rather
# than set here. Note the renames: `discount` reads agent.actor_gamma and
# `discretize_done` reads agent.discretize_done_actor.
discount: ${agent.actor_gamma}
discretize_done: ${agent.discretize_done_actor}
update_encoder_actor: ${agent.update_encoder_actor}
# Resolved from the top-level `device` entry of the composed config.
device: ${device}
share_encoder: ${agent.share_encoder}