{
  "train_data_size": 200000,
  "test_data_size": 1000,
  "seq_len": 13,
  "data_min": 20,
  "data_max": 100,
  "data_mode": ["train", "test"],
  "data_percent": [0.5, 0.5],
  "data_name": ["train", "test"],
  "data_mask": [0, 1],
  "data_show": [1, 1],
  "target": "single_chain_search",
  "batch_size": 100,
  "vocab_size": 201,
  "max_pos": 20,
  "d_model": 400,
  "d_feedforward": 1200,
  "d_k": 64,
  "d_v": 64,
  "n_layers": 3,
  "n_heads": 1,
  "clip": 1,
  "n_epoch": 4000,
  "lr": 2e-05,
  "lr_decay_step": 1000,
  "lr_decay_rate": 1,
  "seed": 1,
  "scheduler": "GradualWarmupScheduler_CosineAnnealingLR",
  "model": "GPT",
  "optim": "AdamW",
  "save_model_epoch": 5,
  "print_loss_epoch": 1,
  "print_acc_epoch": 5,
  "plot_loss_acc_epoch": 10,
  "prefix": " ",
  "suffix": "3L1H",
  "dir_suffix": "2_step_reasoning",
  "train_method": " ",
  "n_batch": 10000,
  "gen_data_mode": "fix",
  "working_dir": "./result/2_step_reasoning/single_chain_search-seed_1-N_200000-3L1H",
  "use_mod_list_specific": "True",
  "optim_T_max": "4000",
  "optim_eta_min": "1e-5",
  "optim_multiplier": "5",
  "optim_total_epoch": "400",
  "train_datasize_train": 100000,
  "test_datasize_train": 500,
  "train_datasize_test": 100000,
  "test_datasize_test": 500
}
