# Settings for the CartPoleSwingUp entry.
CartPoleSwingUp:
  observation_space: 5
  action_space: 1
  # Equals observation_space + action_space (5 + 1).
  sa_dimension: 6
  dataset0:
    # Written as plain integers on purpose: `_` digit separators are only
    # resolved as integers by YAML 1.1 loaders; YAML 1.2 core-schema loaders
    # would return strings instead.
    # NOTE(review): presumably identifiers of the source policies that are
    # mixed into this dataset - confirm against the loader.
    pibs: [5000, 10000, 20000]
    # One weight per `pibs` entry; the weights sum to 1.0.
    mix: [0.334, 0.333, 0.333]
    num_samples: 100000
# Settings for the CheetahRun entry.
CheetahRun:
  observation_space: 17
  action_space: 6
  # Equals observation_space + action_space (17 + 6).
  sa_dimension: 23
  # Three-source recipe. Integers are written without `_` digit separators
  # because only YAML 1.1 loaders resolve that form as an integer; YAML 1.2
  # core-schema loaders would return strings.
  dataset0:
    # NOTE(review): presumably identifiers of the source policies that are
    # mixed into this dataset - confirm against the loader.
    pibs: [10000, 50000, 100000]
    # One weight per `pibs` entry; the weights sum to 1.0.
    mix: [0.334, 0.333, 0.333]
    num_samples: 100000
  # Single-source recipe: one `pibs` entry carrying the full weight.
  dataset1:
    pibs: [10000]
    mix: [1.0]
    num_samples: 100000

# Settings for the FingerEasy entry.
FingerEasy:
  observation_space: 12
  action_space: 2
  # Equals observation_space + action_space (12 + 2).
  sa_dimension: 14
  dataset0:
    # Written as plain integers on purpose: `_` digit separators are only
    # resolved as integers by YAML 1.1 loaders; YAML 1.2 core-schema loaders
    # would return strings instead.
    # NOTE(review): presumably identifiers of the source policies that are
    # mixed into this dataset - confirm against the loader.
    pibs: [20000, 200000, 300000]
    # One weight per `pibs` entry; the weights sum to 1.0.
    mix: [0.334, 0.333, 0.333]
    num_samples: 100000

# Settings for the WalkerStand entry.
WalkerStand:
  observation_space: 24
  action_space: 6
  # Equals observation_space + action_space (24 + 6).
  sa_dimension: 30
  # Three-source recipe. Integers are written without `_` digit separators
  # because only YAML 1.1 loaders resolve that form as an integer; YAML 1.2
  # core-schema loaders would return strings.
  dataset0:
    # NOTE(review): presumably identifiers of the source policies that are
    # mixed into this dataset - confirm against the loader.
    pibs: [20000, 40000, 100000]
    # One weight per `pibs` entry; the weights sum to 1.0.
    mix: [0.334, 0.333, 0.333]
    num_samples: 100000
  # Single-source recipe: one `pibs` entry carrying the full weight.
  dataset1:
    pibs: [20000]
    mix: [1.0]
    num_samples: 100000
# Settings for the Walker entry.
Walker:
  observation_space: 17
  action_space: 6
  # Named three-element weight lists; every list sums to 1.
  # NOTE(review): slot order looks like (expert, medium, random), judging by
  # which slot each single-source list sets to 1 - confirm against the loader.
  random: [0.0, 0.0, 1.0]
  medium: [0.0, 1.0, 0.0]
  medium-expert: [0.5, 0.5, 0.0]
  expert: [1.0, 0.0, 0.0]
  d4rl:
    expert: 10
    medium: 5
    # `{}` is a placeholder left for the consumer to fill in.
    # NOTE(review): presumably receives the `expert` / `medium` value above -
    # confirm.
    pi_url: 'walker_online_{}.pkl'
# Settings for the Cheetah entry.
Cheetah:
  observation_space: 17
  action_space: 6
  # Mix proportions: named three-element weight lists; every list sums to 1.
  # NOTE(review): slot order looks like (expert, medium, random), judging by
  # which slot each single-source list sets to 1 - confirm against the loader.
  random: [0.0, 0.0, 1.0]
  medium: [0.0, 1.0, 0.0]
  medium-expert: [0.5, 0.5, 0.0]
  expert: [1.0, 0.0, 0.0]
  d4rl:
    expert: 10
    medium: 5
    # `{}` is a placeholder left for the consumer to fill in.
    # NOTE(review): presumably receives the `expert` / `medium` value above -
    # confirm.
    pi_url: 'halfcheetah_online_{}.pkl'
# Settings for the Hopper entry.
Hopper:
  observation_space: 11
  action_space: 3
  # Named three-element weight lists; every list sums to 1.
  # NOTE(review): slot order looks like (expert, medium, random), judging by
  # which slot each single-source list sets to 1 - confirm against the loader.
  random: [0.0, 0.0, 1.0]
  medium: [0.0, 1.0, 0.0]
  medium-expert: [0.5, 0.5, 0.0]
  expert: [1.0, 0.0, 0.0]
  d4rl:
    expert: 10
    medium: 5
    # `{}` is a placeholder left for the consumer to fill in.
    # NOTE(review): presumably receives the `expert` / `medium` value above -
    # confirm.
    pi_url: 'hopper_online_{}.pkl'
