wandb_project_name=permutation

task=index
# task=square_mod19
# task=relu
# task=prod
encoding_method=standard
epochs=10
target_len=13
layer_num=4
head_num=4
d_model=256
dim_feedforward=$((d_model * 4))
batch_size=128

count=3
# perm_name="forward"
# perm_name="perm_v1"
# perm_name="forward"
# perm_name="reverse"
perm_name="discovered"

# Forward order
# permutation_str="0,1,2,3,4"
permutation_str="0,1,2,3,4,5,6,7,8,9,10,11,12"
# permutation_str="0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24"
# permutation_str="0,1,2,3,4,5,6,7,8,9,10,11,12"

# Reverse order
# permutation_str="4,3,2,1,0"
# permutation_str="12,11,10,9,8,7,6,5,4,3,2,1,0"
# permutation_str="9,8,7,6,5,4,3,2,1,0"
# permutation_str="34,33,32,31,30,29,28,27,26,25,24,23,22,21,20,19,18,17,16,15,14,13,12,11,10,9,8,7,6,5,4,3,2,1,0"
# permutation_str="12,11,10,9,8,7,6,5,4,3,2,1,0"

# permutation_str="0,1,9,2,3,4,5,6,7,8"
# relu, n=7
# permutation_str="2,3,4,5,0,6,1"
# relu, n=10
# permutation_str="4,5,6,7,8,9,0,1,2,3"

# # square mod 19 n=5
# permutation_str="2,1,0,4,3"


# # square mod 19 n=10
# permutation_str="3,4,5,6,7,8,9,1,0,2" # Genetic algorithm (data.test)
# permutation_str="4,5,6,7,8,9,0,1,2,3"

# # square mod 19 n=20
# permutation_str="9,10,11,12,13,14,2,3,4,5,6,15,16,17,18,19,0,1,7,8" # Genetic algorithm (data.test)


# # relu n=5
# permutation_str="2,1,0,4,3"
# permutation_str="4,0,1,2,3"

# # relu n=10
# permutation_str="0,1,2,3,4,5,6,7,8,9"

# # relu n=20
# permutation_str="6,7,9,8,12,11,13,18,17,14,16,15,19,5,10,1,0,3,4,2"

# # index n=13, m=2
# permutation_str="0,1,2,3,4,10,9,5,6,12,11,7,8"
# permutation_str="4,3,5,6,7,8,9,10,11,12,1,0,2"


nvars=1
field=ZZ
max_coefficient=500
max_degree=20
max_seq_len=128

exp_name=permutation
data_class=small
# data_name="n=${target_len}/data"
# data_name="n=5/data-inv"
data_name="n=${target_len}_m=2/data"
data_path=data/data/${data_class}/${task}/${data_name}

run_name=${exp_name}_${data_class}_${task}_n=${target_len}_${perm_name}
run_name_sub=${exp_name}_${field}_n=${target_len}_bs=${batch_size}_L=${layer_num}_H=${head_num}_D=${d_model}_DFF=${dim_feedforward}_E=${epochs}_${perm_name}
save_path=data/results/${data_class}/${task}/${run_name_sub}

mkdir -p $save_path
CUDA_VISIBLE_DEVICES=$count nohup python3 src/main_training_permutation.py  --save_path $save_path \
                                            --data_path $data_path \
                                            --task $task \
                                            --epochs $epochs \
                                            --target_len $target_len \
                                            --num_batch $batch_size \
                                            --num_encoder_layers $layer_num \
                                            --num_decoder_layers $layer_num \
                                            --nhead $head_num \
                                            --exp_name $wandb_project_name \
                                            --exp_id $run_name \
                                            --num_variables $nvars \
                                            --field $field \
                                            --max_coefficient $max_coefficient \
                                            --max_degree $max_degree \
                                            --model "gpt2" \
                                            --d_model $d_model \
                                            --dim_feedforward $dim_feedforward \
                                            --max_sequence_length $max_seq_len \
                                            --permutation_str $permutation_str > $save_path/run.log 2>&1 &