# ===================
# ====== task ======
# ===================
# Task set to run: 'general' or 'webshop'.
task_set: 'general'
# Split of the task set: 'train' or 'test'.
task_split: 'train'
eval_sample_mode: 'random'
# Maximum number of steps; use 10 for AitW General, 20 for AitW Web Shopping.
max_steps: 10

# ===================
# ====== token ======
# ===================
# Credentials are blank in this file. Fill them in locally and avoid
# committing real values to version control.
huggingface_token: ''
wandb_key: ''
gemini_key: ''

# ===================
# ====== algo ======
# ===================
# Model identifiers / local paths. NOTE(review): presumably the reference
# policy, the trained policy, and the critic backbone - confirm with the loader.
policy_ref_lm: '/home/<username>/autoui/Auto-UI-Base'
policy_lm: '/home/<username>/autoui/Auto-UI-Base'
critic_lm: 'roberta-base'
capacity: 2000  # replay buffer size
epochs: 5  # number of epochs for the critic each iteration
batch_size: 4
bsize: 8  # number of emulators run in parallel on the machine
# How many trajectories to collect between training iterations
# (should be a multiple of bsize).
rollout_size: 16
grad_accum_steps: 32
# How many iterations only collect data and evaluate before training starts.
warmup_iter: 0
actor_epochs: 20  # number of epochs for training the actor each iteration
trajectory_critic_epochs: 5
# Learning rates are written with a dot in the mantissa so that YAML 1.1
# loaders (e.g. PyYAML) resolve them as floats; a bare `1e-4` is loaded as a
# string by those parsers.
lm_lr: 1.0e-4
critic_lr: 1.0e-4
max_grad_norm: 0.01
gamma: 0.5

# ===================
# ====== agent ======
# ===================
# Booleans use the canonical lowercase `true` / `false` spelling so every
# YAML loader and linter reads them the same way.
use_lora: false
agent_name: 'autoui'
do_sample: true
temperature: 1.0
tau: 0.01  # soft update parameter
max_new_tokens: 128

# ===================
# ====== log ======
# ===================
# Booleans use the canonical lowercase `true` / `false` spelling.
record: false
use_wandb: true
# Blank in this file. NOTE(review): presumably the Weights & Biases entity and
# project used when use_wandb is true - confirm against the logging code.
entity_name: ''
project_name: ''

# ===================
# ====== path ======
# ===================
# Machine-specific locations. Every value below contains the literal
# placeholder <username>, which must be replaced with a real path.
# AVD home directory; find it with: echo $ANDROID_AVD_HOME
android_avd_home: '/home/<username>/.android/avd'
# Emulator binary; find it with: which emulator
emulator_path: '/home/<username>/.android/emulator/emulator'
# adb binary; find it with: which adb
adb_path: '/home/<username>/.android/platform-tools/adb'
cache_dir: '/home/<username>/.cache'
assets_path: '/home/<username>/vscrl/vscrl/environment/android/assets/task_set'