# Run identification and output/storage switches.
# NOTE(review): the exact effect of each flag is defined by the consuming
# script, which is not visible from this file — confirm before changing.
# Booleans use the canonical lowercase form so every YAML loader agrees.
name: test

check_already_ran: true
overwrite: true

local: true
blob: false

# Algorithm, environment, and network selection.
# NOTE(review): the set of accepted values for these keys is defined by the
# consuming code — confirm there before editing.
alg: rl

env_type: atari
env_id: Breakout
norm: scale
network: dqn

# NOTE(review): presumably a run index and a shard count — confirm.
run: 1
num_shards: 1

# Settings for the `b_`-prefixed component.
# NOTE(review): `b_` presumably refers to a behavior(-cloning) model, given
# that b_config names `train_bc_atari` — confirm against the consumer.
b_config: train_bc_atari
b_step: 100000
b_network: dqn
b_norm: scale
b_lr: 0.0003

# Settings for the `unc_`-prefixed component.
# NOTE(review): `unc_` presumably refers to an uncertainty model, given that
# unc_config names `train_uncertainty_atari` — confirm against the consumer.
# Boolean uses the canonical lowercase form.
wrap_unc: true
unc_type: s

unc_config: train_uncertainty_atari
unc_step: 100000
unc_network: dqn
unc_n_comp: 5
unc_feature_dim: 64
unc_noise_scale: 0.0
unc_prior_scale: 1.0
unc_beta: 1.0
unc_norm: scale
unc_seed: 0
unc_lr: 0.0001

# Learner / actor selection and associated coefficients.
# NOTE(review): how epsilon, tau, and alpha are used is defined by the
# consuming code; all three are 0.0 here — confirm this is intentional.
# Boolean uses the canonical lowercase form.
learner: cql
actor: greedy
min_prob: 0.01

use_heuristic: true
epsilon: 0.0
tau: 0.0
alpha: 0.0

# Training schedule.
# NOTE(review): train_steps is 1,000,001 while eval_period and ckpt_period
# both divide 1,000,000 — presumably the extra step lets the final
# evaluation/checkpoint fire; confirm against the training loop.
train_steps: 1000001
eval_period: 100000
eval_episodes: 5
ckpt_period: 500000

# Seed and optimization hyperparameters.
seed: 0
batch_size: 256
lr: 0.00003
target_update_period: 2500
discount: 0.99

# Optional width overrides.
# NOTE(review): YAML loads a plain `None` as the string "None", not as null.
# If the consumer expects a real null here, these should be written `null`;
# left unchanged because the consumer may compare against the string — confirm.
width: None
unc_width: None
b_width: None

