# Exploration-related settings.
# NOTE(review): the meanings below are inferred from key names only; confirm
# them against the code that consumes this config.

# Selected baseline; "rnd" presumably means Random Network Distillation
# -- TODO confirm.
baseline: "rnd"
# Name of the input representation; valid options are not visible here.
input_type: "obs_feat"
# Presumably the sequence length used for exploration -- TODO confirm.
expl_seq_len: 1
# Presumably the exploration coefficient/weight -- TODO confirm.
k_expl: 0.05
# Boolean flag in canonical lowercase form so every YAML loader reads it
# the same way; presumably toggles annealing of k_expl -- TODO confirm.
anneal_k: false