#!/bin/bash
#
# Launch train_carla_fusion.py for the CARLA "HighwayLimit" task.
#
# Usage:
#   <this script> [extra train_carla_fusion.py options...]
#
# Any extra command-line arguments are forwarded verbatim to the Python
# script. They are inserted right after `--seed 1`, i.e. before the options
# from `--frame_stack` onwards.
# NOTE(review): if the Python side resolves repeated options as "last one
# wins", forwarded arguments can override the options listed before that
# point but not the ones after it -- confirm this ordering is intended.

# Abort on the first failing command, on use of an unset variable, and on a
# failure in any pipeline stage, so training never starts half-configured
# (for example when the save directory could not be created).
set -euo pipefail

# Run configuration. These are exported, so they are also visible in the
# environment of the Python process started below.
export DOMAIN=carla
export SCENARIOS=highway
export TASK=HighwayLimit
export LOSS_TYPE=value
export SAVEDIR=./save
mkdir -p -- "${SAVEDIR}"
export CRITIC_PATH=/home/xxxx/carla_HighwayLimit_pretrain_Qwen_2B_loss_seed:1_2025-02-24-08-12-24/model

# The options are collected in an array so that every expansion stays a
# single word and disabled flags can be kept as ordinary comments, without
# relying on backslash line continuations.
train_args=(
  --port 20006
  --trafficManagerPort 20506
  --domain_name "${DOMAIN}"
  --task_name "${TASK}"
  --scenarios "${SCENARIOS}"
  --loss_type "${LOSS_TYPE}"
  --data_augs no_aug
  --agent 'deepmdp'
  --init_steps 1000
  --num_train_steps 100000
  --encoder_type pixelCarla
  --decoder_type identity
  --img_source video
  # Quoted on purpose: the glob pattern is handed to Python unexpanded.
  --resource_files 'distractors/*.mp4'
  --action_repeat 4
  --critic_tau 0.01
  --encoder_tau 0.05
  --decoder_weight_lambda 0.0000001
  --hidden_dim 1024
  --total_frames 10000
  --num_filters 32
  --batch_size 128
  --init_temperature 0.1
  --alpha_lr 1e-4
  --alpha_beta 0.5
  --work_dir "${SAVEDIR}/${DOMAIN}_${TASK}_${LOSS_TYPE}"
  --seed 1
  # Caller-supplied extras; quoted so arguments containing spaces or glob
  # characters reach Python unchanged.
  "$@"
  --frame_stack 3
  --image_size 128
  --eval_freq 100
  --num_eval_episodes 20
  --vlm_freq 10
  --load_critic_best 0
  --critic_best_path "${CRITIC_PATH}"
  --save_tb
  --save_model
  --save_video
  # --save_buffer
  # --render
)

# CUDA_VISIBLE_DEVICES=4 is set only for this one command.
CUDA_VISIBLE_DEVICES=4 python train_carla_fusion.py "${train_args[@]}"