# Configuration section `deep-ope`.
#
# Exponent floats are written with an explicit decimal point (1.0e-5, not
# 1e-5): YAML 1.1 loaders such as PyYAML only resolve a plain scalar as a
# float when the mantissa contains ".", so a bare 1e-5 is loaded as the
# string "1e-5". Booleans use the canonical lowercase true/false.
deep-ope:
  common:  # settings shared by every entry under `algorithms`
    phi_hidden_dim: 1024
    phi_num_hidden_layers: 1
    phi_norm_type: layer
    # NOTE(review): phi_hard_update_freq is also listed under `hps` below
    # with the same value; which entry takes precedence is decided by the
    # consumer -- confirm before changing only one of them.
    phi_hard_update_freq: 1
    phi_act_function: relu
    mini_batch_size: 2048
    # Every value here is a list. Presumably each listed value produces one
    # run (hyperparameter sweep) -- TODO confirm against the launcher.
    hps:
      phi_outdim: [7]
      phi_hard_update_freq: [1]
      phi_lr: [1.0e-5]
  # Per-algorithm settings, keyed by algorithm name. All entries select an
  # encoder via `encoder_name` and enable `phi_use_penultimate`; BCRL adds
  # two keys of its own.
  algorithms:
    FQE:
      encoder_name: fqe
      phi_use_penultimate: true
    KROPE:
      encoder_name: fqeaux-krope
      phi_use_penultimate: true
    BCRL:
      encoder_name: fqeaux-bcrl
      phi_use_penultimate: true
      bcrl_norm_selfpred: false
      M_lr: 1.0e-4
    DR3:
      encoder_name: fqeaux-dr3
      phi_use_penultimate: true
    BEER:
      encoder_name: fqeaux-beer
      phi_use_penultimate: true

# Configuration section `tabular-ope`.
#
# Exponent floats are written with an explicit decimal point (1.0e-4, not
# 1e-4): YAML 1.1 loaders such as PyYAML only resolve a plain scalar as a
# float when the mantissa contains ".", so a bare 1e-4 is loaded as the
# string "1e-4". Booleans use the canonical lowercase true/false.
tabular-ope:
  common:  # settings shared by every entry under `algorithms`
    phi_hidden_dim: 0
    phi_num_hidden_layers: 0
    phi_norm_type: none
    clip_target: true
    mini_batch_size: 2048
    # Every value here is a list. Presumably each listed value produces one
    # run (hyperparameter sweep) -- TODO confirm against the launcher.
    # Commented-out entries are disabled options kept for reference.
    hps:
      # lam_inv: [1.0e-3]
      # batch_size: [1, 10, 50, 100, 500]
      phi_outdim: [20]
      phi_hard_update_freq: [1]
      phi_lr: [1.0e-4]
      # mix_ratio: [0.05, 0.1, 0.2, 0.3, 0.4, 0.5]
      # mix_ratio: [0.15, 0.25]
    # pw_dataset: true
    roy_off_type: random
  # Per-algorithm settings, keyed by algorithm name. All active entries
  # select an encoder via `encoder_name` and enable `phi_use_penultimate`;
  # BCRL adds two keys of its own.
  algorithms:
    FQE:
      encoder_name: fqe
      phi_use_penultimate: true
    KROPE:
      encoder_name: fqeaux-krope
      phi_use_penultimate: true
    BCRL:
      encoder_name: fqeaux-bcrl
      phi_use_penultimate: true
      bcrl_norm_selfpred: false
      M_lr: 1.0e-4
    DR3:
      encoder_name: fqeaux-dr3
      phi_use_penultimate: true
    BEER:
      encoder_name: fqeaux-beer
      phi_use_penultimate: true
    # Disabled algorithm entries, kept for reference.
    # identity:
    #   encoder_name: identity
    # bcrl:
    #   encoder_name: bcrl
    #   bcrl_norm_selfpred: false
    #   M_lr: 1.0e-3
    # bcrl-lat:
    #   encoder_name: bcrl-lat
    #   bcrl_norm_selfpred: false
    #   M_lr: 1.0e-3
    # bcrl-logdet:
    #   encoder_name: bcrl
    #   bcrl_norm_selfpred: true
    #   bcrl_logdet: 1.0e-2
    # krope0:
    #   encoder_name: krope
    #   roy_sample_num: 0
    # krope1:
    #   encoder_name: krope
    #   roy_sample_num: 1
    # krope2:
    #   encoder_name: krope
    #   roy_sample_num: 2
    # krope3:
    #   encoder_name: krope
    #   roy_sample_num: 3
