# Environment/domain settings.
# NOTE(review): `_target_` looks like a Hydra-style instantiation target
# (here `domains.minatarenv`) - confirm against the loading code.
domain:
  _target_: domains.minatarenv
  envname: 'breakout'
  expert_policy_path: 'breakout/model/model_data_and_weights'

# Experiment settings.
# NOTE(review): the meaning of each key is defined by the consuming code,
# which is not visible in this file - confirm before changing values.
exp:
  each_query: 250
  initial_sample: 250

  softmax_af: false
  af_thre: 0.9

  qiterations: 0
  qalpha: 0

  algo: visit  # guided, visit, uniform
  # `none` here is the plain string "none", not a YAML null.
  impute: none  # zero, mean, max, min, gt, none

  decay: 'concave'  # concave, convex, linear
  fixeddecay: true
  fixtime: 0.5
  decay_temp: 6.0
  packbits: true

  # Q-function model settings.
  # NOTE(review): `_target_` presumably selects `models.dqn` for
  # instantiation, with the remaining keys passed as arguments - confirm.
  qfunction:
    _target_: models.dqn
    tau: 0.7
    beta: 3.0
    alpha: 0.005
    batch_size: 256
    # Written without digit-group underscores: `125_000` is an integer only
    # under YAML 1.1 rules and loads as a string in YAML 1.2 parsers.
    num_epochs: 125000

  # Settings for the `models.dil` target.
  # NOTE(review): `_target_` presumably selects `models.dil` for
  # instantiation, with the remaining keys passed as arguments - confirm.
  il:
    _target_: models.dil
    # Written without digit-group underscores: `125_000` is an integer only
    # under YAML 1.1 rules and loads as a string in YAML 1.2 parsers.
    num_epochs: 125000
    batch_size: 256
    load_path: 'breakout/model/il_weights'
