# @package agent
# Hydra configuration for the POTIL agent.
# NOTE(review): the keys below are presumably passed as keyword arguments to
# the class named by `_target_` -- confirm against its constructor.
#
# Conventions used in this file:
#   ???     mandatory value; must be supplied elsewhere before use
#   ${...}  interpolation of another node of the composed config
#   null    no value (None on the Python side)
_target_: agent.potil.POTILAgent
obs_shape: ???  # to be specified later
action_shape: ???  # to be specified later
device: ${device}
# Written with a mantissa dot so that plain YAML 1.1 loaders also read a
# float rather than the string "1e-4".
lr: 1.0e-4
critic_target_tau: 0.005
update_every_steps: 2
use_tb: ${use_tb}
num_expl_steps: 2000
hidden_dim: ${suite.hidden_dim}
feature_dim: 50
stddev_schedule: 0.1  # commented-out alternative: 'linear(1.0,0.1,500000)'
stddev_clip: 0.3

# Exploration settings (expl_*); unset entries are explicit nulls.
expl_stddev: null  # for expl_mode
expl_noise: 'linear(0.5,0.2,500000)'
expl_mode: null
expl_offset: null

update_policy_freq: 1
augment: true

# Reward settings.
rewards: sinkhorn_cosine
sinkhorn_rew_scale: 200
update_target_every: 10000
auto_rew_scale: true
auto_rew_scale_factor: 10
auto_rew_scale_wo_truncate: false

suite_name: ${suite.name}
obs_type: ${obs_type}
bc_weight_type: ${bc_weight_type}
bc_weight_schedule: 'linear(1.0,0.1,20000)'
bandwidth: 10000
name: 'potil'
use_trunk: false

# Timestamp options, all taken from the selected suite config.
timestamp: ${suite.timestamp}
timestamp_onehot: ${suite.timestamp_onehot}
timestamp_dim: ${suite.timestamp_dim}

ot_truncate: null
use_inverse_dynamics: false
alpha: 0.4
use_timeout: false
cost_bias: 0
countdown_scale: null  # None by default
countdown_noise: false
nstep: ${nstep}
timeout_mean_reward: false