# Experiment definitions. Each key under `experiments` names one experiment
# and holds its `problem`, `parameters`, `algorithms` (a list of template
# names), `runs`, and `output` settings.
experiments:
  # Experiment `glb_default`: runs problem `glb` against seven algorithm
  # templates, saves the results to a pickle file, and enables plotting.
  glb_default:
    problem: glb
    # Problem-instance settings. How each value is interpreted is decided by
    # the code that loads this file, which is not shown here.
    # NOTE(review): `T` is presumably the horizon (number of rounds) and `d`
    # the feature dimension -- confirm against the loader.
    parameters:
      T: 50000
      num_actions: 100
      d: 10
      noise_variance: 0.01
      theta_bound: 1.0
      action_bound: 1.0
      mean_low: -1.0
      mean_high: 1.0
      reward_bound: 1.0
      xi: 0.4
      seed: 205
    # Algorithms are referenced by template name only; the template
    # definitions are not part of this section.
    algorithms:
      - template: dal_glb
      - template: dal_glb_gsr
      - template: glb_weight_ucb
      - template: glb_restart
      - template: glb_dglucb
      - template: glb_swglucb
      - template: glb_bvd
    # NOTE(review): `n_mc` is presumably the number of Monte Carlo
    # repetitions, and `n_jobs: -1` presumably means "use all available
    # workers" -- confirm against the runner.
    runs:
      n_mc: 15
      n_jobs: -1
    output:
      # NOTE(review): the `_v2` suffix is used only by `glb_default` and
      # `lb_default` among the experiments in this file -- confirm intended.
      save: results/glb_default_v2.pkl
      plot: true

  # Experiment `lb_default`: runs problem `lb` against seven algorithm
  # templates, saves the results to a pickle file, and enables plotting.
  lb_default:
    problem: lb
    # Problem-instance settings. How each value is interpreted is decided by
    # the code that loads this file, which is not shown here.
    # NOTE(review): unlike `glb_default`, no `mean_low`, `mean_high`, or
    # `reward_bound` is set here -- confirm the loader does not require them.
    parameters:
      T: 50000
      num_actions: 100
      d: 10
      noise_variance: 0.01
      theta_bound: 1.0
      action_bound: 1.0
      xi: 0.4
      seed: 205
    # Algorithms are referenced by template name only; the template
    # definitions are not part of this section.
    algorithms:
      - template: master_lb
      - template: dal_lb
      - template: dal_lb_gsr
      - template: lb_weight_ucb
      - template: lb_restart
      - template: lb_window
      - template: lb_dlin
    # NOTE(review): `n_mc` is presumably the number of Monte Carlo
    # repetitions, and `n_jobs: -1` presumably means "use all available
    # workers" -- confirm against the runner.
    runs:
      n_mc: 15
      n_jobs: -1
    output:
      save: results/lb_default_v2.pkl
      plot: true

  # Experiment `lb_ball`: runs problem `lb_ball` against three algorithm
  # templates, saves the results to a pickle file, and enables plotting.
  lb_ball:
    problem: lb_ball
    # Problem-instance settings. How each value is interpreted is decided by
    # the code that loads this file, which is not shown here.
    # NOTE(review): `radius` and `continuous` appear only in this experiment;
    # presumably they describe a continuous ball-shaped action set -- confirm.
    parameters:
      T: 50000
      num_actions: 100
      d: 5
      noise_variance: 0.1
      theta_bound: 1.0
      action_bound: 1.0
      radius: 0.08
      xi: 0.4
      seed: 205
      mean_low: -1.0
      mean_high: 1.0
      continuous: true
    # Algorithms are referenced by template name only; the template
    # definitions are not part of this section.
    algorithms:
      - template: dal_lb
      - template: dal_lb_gsr
      - template: lb_weight_ucb
    # This experiment uses `n_mc: 30`, whereas the other experiments in this
    # file use 15.
    runs:
      n_mc: 30
      n_jobs: -1
    output:
      save: results/lb_ball.pkl
      plot: true

  # Experiment `scb_default`: runs problem `scb` against six algorithm
  # templates, saves the results to a pickle file, and enables plotting.
  scb_default:
    problem: scb
    # Problem-instance settings. How each value is interpreted is decided by
    # the code that loads this file, which is not shown here.
    # Note that `theta_bound` is 3.0 here, while the other experiments in
    # this file that set it use 1.0.
    parameters:
      T: 50000
      num_actions: 100
      d: 10
      noise_variance: 0.01
      theta_bound: 3.0
      action_bound: 1.0
      reward_bound: 1.0
      xi: 0.4
      seed: 205
    # Algorithms are referenced by template name only; the template
    # definitions are not part of this section.
    algorithms:
      - template: master_scb
      - template: scb_weight_ucb
      - template: dal_ofu_glb
      - template: dal_ofu_glb_gsr
      - template: scb_dglb
      - template: scb_restart
    # NOTE(review): `n_mc` is presumably the number of Monte Carlo
    # repetitions, and `n_jobs: -1` presumably means "use all available
    # workers" -- confirm against the runner.
    runs:
      n_mc: 15
      n_jobs: -1
    output:
      save: results/scb_default.pkl
      plot: true

  # Experiment `kb_default`: runs problem `kb` against six algorithm
  # templates, saves the results to a pickle file, and enables plotting.
  kb_default:
    problem: kb
    # Problem-instance settings. How each value is interpreted is decided by
    # the code that loads this file, which is not shown here.
    # `kernel_length_scale`, `tol`, and `reward_generation_method` appear
    # only in this experiment.
    parameters:
      T: 50000
      num_actions: 100
      d: 10
      noise_variance: 0.01
      reward_bound: 0.8
      kernel_length_scale: 0.2
      tol: 0.1
      xi: 0.4
      seed: 205
      mean_low: -1.0
      mean_high: 1.0
      reward_generation_method: kernel_sum
    # Algorithms are referenced by template name only; the template
    # definitions are not part of this section.
    algorithms:
      - template: opkb_kb
      - template: gp_ucb
      - template: dal_kb
      - template: dal_kb_gsr
      - template: gp_ucb_r
      - template: gp_ucb_sw
    # NOTE(review): `n_mc` is presumably the number of Monte Carlo
    # repetitions, and `n_jobs: -1` presumably means "use all available
    # workers" -- confirm against the runner.
    runs:
      n_mc: 15
      n_jobs: -1
    output:
      save: results/kb_default.pkl
      plot: true


  # Experiment `cb_default`: runs problem `cb` against four algorithm
  # templates, saves the results to a pickle file, and enables plotting.
  cb_default:
    problem: cb
    # This is the only experiment in this file that sets a `simulation` key.
    # NOTE(review): presumably selects a contextual simulation loop -- confirm.
    simulation: contextual
    # Problem-instance settings. How each value is interpreted is decided by
    # the code that loads this file, which is not shown here.
    # `d_ctx`, `context_mode`, and `policy_count` appear only in this
    # experiment.
    parameters:
      T: 50000
      num_actions: 100
      d: 10
      d_ctx: 10
      noise_variance: 0.01
      reward_bound: 1.0
      action_bound: 1.0
      context_mode: finite
      xi: 0.4
      seed: 205
      policy_count: 100
      mean_low: -1.0
      mean_high: 1.0
    # Algorithms are referenced by template name only; the template
    # definitions are not part of this section.
    algorithms:
      - template: dal_context
      - template: dal_context_gsr
      - template: adailtcb_plus
      - template: master_context
    # NOTE(review): `n_mc` is presumably the number of Monte Carlo
    # repetitions, and `n_jobs: -1` presumably means "use all available
    # workers" -- confirm against the runner.
    runs:
      n_mc: 15
      n_jobs: -1
    output:
      save: results/cb_default.pkl
      plot: true
