# Launch JaxCQL.conservative_td3bc_main for one environment / GPU / seed.
#
# Usage: <this script> <env> <gpu_ids> <seed>
#   env      - environment name passed to --env, e.g. one of:
#              halfcheetah-medium-v2 walker2d-medium-v2 hopper-medium-v2 ant-medium-v2
#   gpu_ids  - value assigned to CUDA_VISIBLE_DEVICES for the python process
#   seed     - value passed to --seed; also the last component of --logging_path
#
# Output directory: ./<proj_name>/<env>/<seed>

# Fail early with a usage message instead of letting an empty argument make
# `--env` / `--seed` swallow the following flag as its value. `${n:?}` exits a
# non-interactive shell. <gpu_ids> is necessarily set whenever <seed> is, and
# may be an explicit empty string.
: "${1:?usage: $0 <env> <gpu_ids> <seed>}"
: "${3:?usage: $0 <env> <gpu_ids> <seed>}"

wandb disabled

# Append the MuJoCo 2.1.0 binaries to the loader path. The `:+` form avoids a
# leading empty entry (which the dynamic loader treats as the current
# directory) when LD_LIBRARY_PATH was previously unset or empty.
export LD_LIBRARY_PATH="${LD_LIBRARY_PATH:+${LD_LIBRARY_PATH}:}/root/.mujoco/mujoco210/bin"
# Presumably silences D4RL warnings about optional environments that fail to
# import -- TODO confirm against the installed d4rl version.
export D4RL_SUPPRESS_IMPORT_ERROR=1
# export CUDA_VISIBLE_DEVICES=0
# export WANDB_DISABLED=True

# Exported under their original names so the python child process still sees them.
export env="$1"
export seed="$3"
proj_name=td3_bc_wo_cql_1_5

# CUDA_VISIBLE_DEVICES and XLA_PYTHON_CLIENT_PREALLOCATE are set for this
# command only. The latter turns off JAX's up-front GPU memory preallocation.
# NOTE(review): "Cal-QL-exapmle" looks like a typo of "example"; it is kept
# as-is so runs keep logging to the same project name.
CUDA_VISIBLE_DEVICES="$2" XLA_PYTHON_CLIENT_PREALLOCATE=false \
  python -m JaxCQL.conservative_td3bc_main \
  --env "$env" \
  --logging.online \
  --seed "$seed" \
  --logging.project=Cal-QL-exapmle \
  --cql_min_q_weight=5.0 \
  --cql.cql_target_action_gap=0.8 \
  --cql.cql_lagrange=False \
  --policy_arch=256-256 \
  --qf_arch=256-256-256-256 \
  --offline_eval_every_n_epoch=50 \
  --online_eval_every_n_env_steps=2000 \
  --eval_n_trajs=20 \
  --n_train_step_per_epoch_offline=1000 \
  --n_pretrain_epochs=1000 \
  --max_online_env_steps=1e6 \
  --mixing_ratio=0.5 \
  --reward_scale=10.0 \
  --reward_bias=-5 \
  --enable_calql=False \
  --logging_path="./${proj_name}/${env}/${seed}"
