#!/bin/sh
# Launch train/train_hands_offline.py with the "mat" algorithm on the
# ShadowHandDoorOpenInward task, with the --use_gail flag enabled.
#
# Usage: run from the directory that contains train/, because the training
# script is referenced by a relative path.
#
# Notes:
#   * train_data_path is an absolute, machine-specific location; edit it
#     before running on another host.
#   * The experiment name spells out ppoEpoch10 / discEpoch5 / discLr1e-5;
#     keep it in sync with --ppo_epoch, --epoch_disc and --disc_lr below
#     when changing any of them.
#   * CUDA_VISIBLE_DEVICES=0 is set only for the python process.

# Abort on a mistyped/unset variable instead of passing an empty argument.
set -u

env="hands"
task="ShadowHandDoorOpenInward"
algo="mat"
exp="test_gail_ppoEpoch10_discEpoch5_discLr1e-5"
seed=1
train_data_path="/home/LAB/qiuyue/language_condition_MAT/scripts/data/ShadowHandDoorOpenInward/happo.pkl"

# Banner so the run configuration is visible at the top of the log.
printf 'env is %s, task is %s, algo is %s, exp is %s, seed is %s\n' \
  "${env}" "${task}" "${algo}" "${exp}" "${seed}"

# Every expansion is quoted so values containing spaces or glob characters
# reach the training script as a single argument. The python exit status is
# the exit status of this script (it is the last command).
CUDA_VISIBLE_DEVICES=0 python train/train_hands_offline.py \
  --env_name "${env}" \
  --seed "${seed}" \
  --algorithm_name "${algo}" \
  --experiment_name "${exp}" \
  --task "${task}" \
  --n_rollout_threads 80 \
  --lr 5e-5 \
  --disc_lr 1e-5 \
  --entropy_coef 0.001 \
  --max_grad_norm 0.5 \
  --log_interval 10 \
  --n_training_threads 16 \
  --num_mini_batch 1 \
  --num_env_steps 50000000 \
  --ppo_epoch 10 \
  --clip_param 0.2 \
  --use_value_active_masks \
  --add_center_xy \
  --use_state_agent \
  --use_policy_active_masks \
  --save_interval 10 \
  --num_epochs 10000 \
  --num_steps_per_epochs 5000 \
  --quick_tqdm \
  --use_gail \
  --normalize_advantage \
  --epoch_disc 5 \
  --train_data_path "${train_data_path}"