#!/usr/bin/env bash
#
# Launches one run of the project's `train` module (`python -m train`) on
# BipedalWalker-Adversarial-v0 with --ued_algo=domain_randomization and
# --use_plr=True.
#
# Usage:
#   <this-script>            # seed defaults to 1
#   <this-script> 3          # seed from the first positional argument
#   SEED=3 <this-script>     # seed from the environment
#
# The seed is passed to --seed and is also used as the suffix of --log_dir
# (logs/BW_PLR_<seed>), so different seeds get different log directories.
#
# NOTE(review): --xpid does not contain the seed, so it is identical for all
# seeds; only --log_dir distinguishes runs. The xpid string also appears to
# spell out several hyperparameter values (lr, epoch, mb, ...) that are set
# again as flags below -- presumably they should be kept in sync by hand when
# a flag is changed; confirm against how `train` uses xpid.

# Precedence: first positional argument, then $SEED from the environment,
# then the historical default of 1.
SEED="${1:-${SEED:-1}}"

# The seed ends up inside a path, so reject anything that is not a plain
# non-negative integer before starting the run.
case "${SEED}" in
  *[!0-9]*)
    printf 'error: SEED must be a non-negative integer, got: %s\n' "${SEED}" >&2
    exit 2
    ;;
esac

python -m train \
    --xpid=ued-BipedalWalker-Adversarial-v0-domain_randomization-noexpgrad-lr0.0003-epoch5-mb32-v0.5-gc0.5-henv0.01-ha0.001-plr0.5-rho0.5-n1000-st0.5-positive_value_loss-rank-t0.1-tl_0 \
    --env_name=BipedalWalker-Adversarial-v0 \
    --use_gae=True \
    --gamma=0.99 \
    --gae_lambda=0.9 \
    --seed="${SEED}" \
    --num_control_points=12 \
    --recurrent_arch=lstm \
    --recurrent_agent=False \
    --recurrent_adversary_env=False \
    --recurrent_hidden_size=1 \
    --use_global_critic=False \
    --lr=0.0003 \
    --num_steps=2048 \
    --num_processes=16 \
    --num_env_steps=2000000000 \
    --ppo_epoch=5 \
    --num_mini_batch=32 \
    --entropy_coef=0.001 \
    --value_loss_coef=0.5 \
    --clip_param=0.2 \
    --clip_value_loss=False \
    --adv_entropy_coef=0.01 \
    --max_grad_norm=0.5 \
    --algo=ppo \
    --ued_algo=domain_randomization \
    --use_plr=True \
    --level_replay_prob=0.5 \
    --level_replay_rho=0.5 \
    --level_replay_seed_buffer_size=1000 \
    --level_replay_score_transform=rank \
    --level_replay_temperature=0.1 \
    --staleness_coef=0.5 \
    --no_exploratory_grad_updates=True \
    --use_editor=False \
    --level_editor_prob=0 \
    --level_editor_method=random \
    --num_edits=0 \
    --base_levels=batch \
    --use_accel_paired=False \
    --accel_paired_score_function=paired \
    --use_lstm=False \
    --use_behavioural_cloning=False \
    --kl_loss_coef=0.0 \
    --kl_update_step=1 \
    --use_kl_only_agent=False \
    --log_interval=10 \
    --screenshot_interval=200 \
    --log_grad_norm=True \
    --normalize_returns=True \
    --checkpoint_basis=student_grad_updates \
    --archive_interval=1000 \
    --reward_shaping=True \
    --use_categorical_adv=True \
    --use_skip=False \
    --choose_start_pos=False \
    --sparse_rewards=False \
    --handle_timelimits=True \
    --level_replay_strategy=positive_value_loss \
    --test_env_names=BipedalWalker-v3,BipedalWalkerHardcore-v3,BipedalWalker-Med-Stairs-v0,BipedalWalker-Med-PitGap-v0,BipedalWalker-Med-StumpHeight-v0,BipedalWalker-Med-Roughness-v0 \
    --log_dir="logs/BW_PLR_${SEED}" \
    --test_interval=1000 \
    --test_num_episodes=128 \
    --test_num_processes=2 \
    --log_plr_buffer_stats=True \
    --log_replay_complexity=True \
    --checkpoint=True \
    --log_action_complexity=False