#!/usr/bin/env bash
#
# Launches a local PPO fine-tuning run: one replay-buffer server, one
# fine-tuning trainer, one eval job and three collect jobs (task ids 0-2),
# all talking to the same server address on 127.0.0.1.
#
# Usage:
#   bash <this script>
#
# Requirements:
#   * Run from a directory that contains ./circuit_training/ (the netlist and
#     placement paths below are relative to the current working directory) and
#     from which `python -m circuit_training...` is importable.
#   * EBROOTCUDNN should point at the cuDNN installation prefix
#     (presumably set by an EasyBuild module -- confirm for your cluster).
#
# Lifetime:
#   The script blocks on the last collect job (task id 2) and exits with that
#   job's status. On any exit path (normal, error, SIGINT, SIGTERM) every job
#   it started is sent SIGTERM, so nothing is left holding the server port.

set -euo pipefail

# Prepend the cuDNN library directory instead of replacing LD_LIBRARY_PATH, so
# library paths already configured in the environment are not discarded.
if [[ -n "${EBROOTCUDNN:-}" ]]; then
  export LD_LIBRARY_PATH="${EBROOTCUDNN}/lib${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}}"
else
  printf 'warning: EBROOTCUDNN is not set; leaving LD_LIBRARY_PATH unchanged\n' >&2
fi

export ROOT_DIR=/logs/ibm01_to_ariane_finetuning
export REVERB_PORT=8008
export REVERB_SERVER="127.0.0.1:${REVERB_PORT}"
export NETLIST_FILE=./circuit_training/environment/test_data/ariane/netlist.pb.txt
export INIT_PLACEMENT=./circuit_training/environment/test_data/ariane/initial.plc
# Checkpoint and policy directories of the earlier run, handed to the trainer
# as --parent_chkpt_dir / --parent_policy_dir.
export CHKPT_DIR=/logs/run_ibm01_scratch/55/train/checkpoints
export PLCY_DIR=/logs/run_ibm01_scratch/55/policies/greedy_policy

# PIDs of every job started by launch(), in start order.
pids=()

#######################################
# Starts a Python module in the background and records its PID.
# Globals:   pids (appended)
# Arguments: $1 - module name for `python -m`; remaining args are its flags
#######################################
launch() {
  python -m "$@" &
  pids+=("$!")
}

#######################################
# Stops all jobs started by launch() and exits with the status the script
# was about to exit with.
# Globals:   pids (read)
#######################################
cleanup() {
  local status=$?
  trap - EXIT
  if (( ${#pids[@]} > 0 )); then
    # Jobs that already finished make kill/wait fail; that is expected.
    kill "${pids[@]}" 2>/dev/null || true
    wait "${pids[@]}" 2>/dev/null || true
  fi
  exit "${status}"
}

trap cleanup EXIT
# Convert signals into a normal exit so the EXIT trap performs the teardown.
trap 'exit 130' INT
trap 'exit 143' TERM

# Flags shared by several jobs.
replay_flags=(
  --replay_buffer_server_address="${REVERB_SERVER}"
  --variable_container_server_address="${REVERB_SERVER}"
)
design_flags=(
  --netlist_file="${NETLIST_FILE}"
  --init_placement="${INIT_PLACEMENT}"
)

launch circuit_training.learning.ppo_reverb_server \
  --root_dir="${ROOT_DIR}" \
  --port="${REVERB_PORT}"

launch circuit_training.learning.fine_tune_target_ppo \
  --root_dir="${ROOT_DIR}" \
  --parent_chkpt_dir="${CHKPT_DIR}" \
  --parent_policy_dir="${PLCY_DIR}" \
  "${replay_flags[@]}" \
  --num_episodes_per_iteration=16 \
  --global_batch_size=64 \
  "${design_flags[@]}"

launch circuit_training.learning.ppo_collect \
  --root_dir="${ROOT_DIR}" \
  "${replay_flags[@]}" \
  --task_id=0 \
  "${design_flags[@]}"

launch circuit_training.learning.eval \
  --root_dir="${ROOT_DIR}" \
  --variable_container_server_address="${REVERB_SERVER}" \
  "${design_flags[@]}"

launch circuit_training.learning.ppo_collect \
  --root_dir="${ROOT_DIR}" \
  "${replay_flags[@]}" \
  --task_id=1 \
  "${design_flags[@]}"

launch circuit_training.learning.ppo_collect \
  --root_dir="${ROOT_DIR}" \
  "${replay_flags[@]}" \
  --task_id=2 \
  "${design_flags[@]}"

# Block on the last collect job. It is run in the background and waited on
# (rather than run in the foreground) because `wait` returns as soon as a
# trapped signal arrives, so INT/TERM trigger the teardown immediately.
last_collector_pid=${pids[${#pids[@]}-1]}
wait "${last_collector_pid}"