# Method selection and its basic settings.
# NOTE(review): what 'ngt' stands for is not defined in this file — confirm
# against the code that reads `method`.
method: 'ngt'
# Integer size setting; presumably an output dimension — TODO confirm.
out_size: 32
# Boolean switch, off in this config; the behaviour it toggles is not shown.
v2: false
# Loss selector; presumably the Huber loss — verify against the consumer.
ngt_loss: 'huber'

# Scalar temperature, 1.0 here. NOTE(review): what it is applied to is not
# visible in this file — confirm with the consuming code.
temperature: 1.0
# Chooses between two percentile ranges; the purpose of the range
# (presumably reward normalisation) is not shown here — TODO confirm.
tighter_percentile_range: true  # 05-95 if false, 10-90 if true
# Optional symexp stretch of the final reward; disabled in this config.
stretch_with_symexp: false  # wrap final reward with symexp temperature 1.0

# Per-update proportions, both set to 1.0 ("exp" presumably means
# experience — TODO confirm).
# NOTE(review): the `p_` and `e_` prefixes are not defined in this file —
# confirm which components they refer to.
p_proportion_of_exp_per_update: 1.0
e_proportion_of_exp_per_update: 1.0
# Scale factor of 1.0; presumably for an adversarial ascent step on `p` —
# TODO confirm against the training code.
advers_p_ascent_scale: 1.0

# Pretraining flag, disabled in this config. NOTE(review): what a pretraining
# phase would involve is not shown here.
pretrain: false
