# Environment to run.
# NOTE(review): presumably resolved to a Gym environment by the consuming
# code - confirm there.
env: gym.Ant-v3

# Episode step limits.
# NOTE(review): presumably the first applies to training episodes and the
# second to test/evaluation episodes - confirm in the consuming code.
max_episode_steps: 100
max_test_episode_steps: 500

# Written as 1.0e+2 rather than 1e2: YAML 1.1 loaders such as PyYAML only
# recognize a float when it has a decimal point and a signed exponent, and
# would otherwise load the value as the string "1e2". This form is the float
# 100.0 under both YAML 1.1 and YAML 1.2 loaders.
collected_trajectories: 1.0e+2
# NOTE(review): the meaning of alpha and beta is defined by the consuming
# code, which is not visible from this file.
alpha: 60.0
beta: 1.0

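# Variable length (full-size settings, currently disabled). The keys below
# are the same ones set in the "Test config" section further down, so only
# one of the two sections may be uncommented at a time.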

# num_train_steps: 5e6
# num_steps_per_skill:
#   - 25e4
#   - 25e4
#   - 1e6
#   - 1e6
#   - 5e4
#   - 5e4
#   - 5e4
#   - 5e4
#   - 25e4
#   - 25e4
# replay_buffer_capacity: 2e6

# num_seed_steps: 5000
# eval_frequency: 50

# Test config: the active settings. They set the same keys as the
# commented-out section above, with much smaller values.

num_train_steps: 1000
# Four per-skill entries; together they add up to 1000, the value of
# num_train_steps.
num_steps_per_skill: [100, 200, 300, 400]
replay_buffer_capacity: 1000

num_seed_steps: 5
eval_frequency: 5
