# Environment ("domain") settings.
# NOTE(review): `_target_` looks like a Hydra-style instantiate key naming the
# object to construct from this mapping — confirm against the config loader.
domain:
  _target_: domains.graph
  # presumably switches the domain to a partially observable variant, with
  # `number_of_pomdp_states` only relevant when enabled — verify in the target
  make_pomdp: false
  number_of_pomdp_states: 2
  transitions_deterministic: true
  max_length: 8
  sparse_rewards: false
  stochastic_rewards: false
  # Reward scheme selector; allowed values are listed inline.
  reward: 'one'  # 'one', 'rand'

# Experiment settings.
# Booleans use canonical lowercase `true`/`false`, and floats carry an explicit
# fractional digit, so every value parses the same under YAML 1.1 and 1.2.
exp:
  each_query: 1
  warmup_sample: 0.0

  softmax_af: false
  # Kept as an integer on purpose; do not rewrite as 0.0 without checking the
  # consumer, since that would change the parsed type.
  af_thre: 0

  # presumably Q-function update settings (iteration count and step size) —
  # TODO confirm against the code that reads them
  qiterations: 10
  qalpha: 0.05

  # Decay schedule shape; allowed values are listed inline.
  decay: 'linear'  # concave, convex, linear
  fixeddecay: true
  fixtime: 0.5
  decay_temp: 6.0
  packbits: false

  # Algorithm selector; allowed values are listed inline.
  algo: 'guided'  # guided, visit, uniform
  # Quoted on purpose: this is the literal string "none", not a YAML null.
  impute: 'none'  # zero, mean, max, min, gt, none

  # NOTE(review): the `_target_` entries below look like Hydra-style
  # instantiate keys — confirm against the config loader.
  qfunction:
    _target_: models.qtable

  il:
    _target_: models.il
