# @package pi

# Hydra `_target_`: dotted path of the class this config describes.
# NOTE(review): the other keys in this file are presumably forwarded to that
# class as constructor arguments — confirm against ExpWeightLearner.
_target_: policy_learner.ExpWeightLearner
# Short identifier for this learner; this file is packaged under `pi`, so it is
# the value that ${pi.name} in model_save_path refers to.
name: exp_weight

# checkpoint paths
# NOTE(review): null presumably means "do not load an existing checkpoint" —
# confirm how the learner treats a null load_path.
load_path: null
# Assembled from interpolations: ${path} and ${name} are looked up at the
# config root (so ${name} is the root-level `name`, not this file's),
# ${pi.name} is this file's `name`, and ${env.domain} is `domain` under `env`.
model_save_path: ${path}/models/${name}_${pi.name}_${env.domain}.pt

# Both values are interpolated from the same-named keys at the config root,
# so this learner shares them with the rest of the composed config.
device: ${device}
discount: ${discount}

# algorithm-specific parameters
# NOTE(review): `temp` is presumably the temperature used in the exponential
# weighting — confirm in ExpWeightLearner.
temp: 0.01

# training parameters
batch_size: 512
# Written with an explicit mantissa dot: a bare `1e-4` is read as a string by
# YAML 1.1 loaders such as PyYAML, whereas `1.0e-4` is a float everywhere.
lr: 1.0e-4
# Dimensions are interpolated from the same-named keys at the config root.
state_dim: ${state_dim}
action_dim: ${action_dim}

# model parameters
# NOTE(review): width/depth presumably set the hidden-layer size and the number
# of layers, and dist_type presumably selects the action-distribution variant
# (`trunc`) — confirm against the model code.
width: 1024
depth: 2
dist_type: trunc

# logging
# Template for the training log line; its fields read step, loss, entropy and
# imitation out of `values`. Single-quoted because it needs no escape sequences.
format_str: 'Pi Train: Step {values[step]:8.0f}, Loss {values[loss]:2.6f},  Entropy {values[entropy]:4.4f}, Imitation Loss {values[imitation]:4.4f}'