# Launch three pretrain.py runs (walker_run, walker_walk, walker_stand) that
# share one set of key=value overrides and differ only in `task`.
#
# All runs are pinned to the same device via CUDA_VISIBLE_DEVICES=1. The first
# two runs are started in the background, each followed by a 60-second pause
# before the next launch (presumably to stagger start-up -- confirm); the last
# run stays in the foreground. Afterwards the script waits for the background
# runs so it does not return while they are still training, and so that a
# failure in any run is reflected in the final status.

# Start one pretrain.py run.
# Arguments: $1 - value for the `task=` override (e.g. walker_run)
# Returns:   the exit status of pretrain.py
launch_pretrain() {
    CUDA_VISIBLE_DEVICES=1 python pretrain.py \
        seed=7 \
        bonus=0.5 \
        task="$1" \
        supervised=True \
        agent=ddpg \
        agent.nstep=1 \
        agent.batch_size=1024 \
        obs_type=states \
        action_repeat=1 \
        num_train_frames=4000010 \
        replay_buffer_size=100000 \
        replay_buffer_num_workers=4 \
        save_replay_buffer=True \
        project=MaskDP_state_data \
        use_wandb=True
}

# Last non-zero exit status seen across the three runs (0 if all succeeded).
pretrain_status=0

launch_pretrain walker_run &
walker_run_pid=$!
sleep 60

launch_pretrain walker_walk &
walker_walk_pid=$!
sleep 60

# Foreground run: keeps the terminal attached to this job, as before.
launch_pretrain walker_stand || pretrain_status=$?

# Block until the background runs finish and collect their exit statuses;
# `wait <pid>` still reports the status if the job has already exited.
wait "$walker_run_pid" || pretrain_status=$?
wait "$walker_walk_pid" || pretrain_status=$?

# Make the final status non-zero if any run failed, without calling `exit`
# (which would terminate the caller's shell if this file is sourced).
[ "$pretrain_status" -eq 0 ]