### Create the graph and prepare the data (both the `simple` and `aug` variants)
# cd data/graph
# python create_graph.py
# python prepare_minigpt.py --type simple
# python prepare_minigpt.py --type aug


### SFT (supervised fine-tuning): run pretrain.py on the graph dataset
# CUDA_VISIBLE_DEVICES=0 python pretrain.py --dataset graph

### Experiments in the main paper (policy gradient and Q-learning, --train_type simple)
# CUDA_VISIBLE_DEVICES=0 python pg_train.py --dataset graph --num_nodes 100 --n_layer 1 --n_head 1 --n_embd 120 --max_iters 100000 --load_ckpt_num 10000 --save_interval 2000 --gen_temp 1.0 --kl_constant 0.0001 --train_type simple --eval_interval 10000 --lr 3e-4

# python q_learning_train.py --device cuda:0 --epsilon 0.1 --n_layer 1 --n_head 1 --n_embd 120 --load_ckpt_num 10000 --lr 2e-4 --soft False --reward_type step --dataset graph --num_episodes 200000 --train_type simple

### Experiments in the appendix (policy gradient and Q-learning, --train_type aug)
# CUDA_VISIBLE_DEVICES=0 python pg_train.py --dataset graph --num_nodes 100 --n_layer 1 --n_head 1 --n_embd 120 --max_iters 100000 --load_ckpt_num 10000 --save_interval 2000 --gen_temp 1.0 --kl_constant 0.0001 --train_type aug --eval_interval 10000 --lr 3e-4

# python q_learning_train.py --device cuda:0 --epsilon 0.1 --n_layer 1 --n_head 1 --n_embd 120 --load_ckpt_num 10000 --lr 2e-4 --soft False --reward_type step --dataset graph --num_episodes 200000 --train_type aug