# @package pi

# Hydra instantiation target: dotted path of the learner class for this node.
_target_: policy_learner.BCLearner
# Short identifier of this policy config. Given the `@package pi` header, this
# is the value that `${pi.name}` refers to.
name: bc

# Presumably the file the trained model is saved to (verify in the learner).
# Interpolations resolve from the config root, so `${name}` is the root-level
# `name` key, whereas `${pi.name}` is the `name: bc` defined in this file.
model_save_path: '${path}/models/${name}_${pi.name}_${env.name}.pt'

# Forwarded from the root-level keys of the same name.
device: '${device}'
discount: '${discount}'

# training parameters
batch_size: 512
# Keep the explicit mantissa dot: YAML 1.1 loaders (e.g. PyYAML) resolve a bare
# `1e-4` as the string "1e-4" instead of a float.
lr: 1.0e-4
# Dimensions are forwarded from the root-level keys of the same name.
state_dim: '${state_dim}'
action_dim: '${action_dim}'

# model parameters
# NOTE(review): width/depth presumably size the policy network's hidden
# layers; confirm against policy_learner.BCLearner.
width: 1024
depth: 2
# NOTE(review): `trunc` presumably selects the action-distribution type;
# confirm the accepted values in the learner.
dist_type: trunc

# logging
# Python format-spec template whose fields index a `values` mapping by the
# keys `step`, `loss` and `entropy`.
# NOTE(review): presumably rendered via str.format(values=...); confirm in the
# logging code.
format_str: "Pi Train: Step {values[step]:8.0f}, Loss {values[loss]:2.6f},  Entropy {values[entropy]:4.4f}"
