"epoch","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - _step","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - _step__MIN","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - _step__MAX","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_128_epoch","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_128_epoch__MIN","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_128_epoch__MAX","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_16_epoch","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_16_epoch__MIN","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_16_epoch__MAX","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_1_epoch","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_1_epoch__MIN","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_1_epoch__MAX","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_256_epoch","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_256_epoch__MIN","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_256_epoch__MAX","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_2_epoch","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_2_epoch__MIN","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_2_epoch__MAX","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_32_epoch","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_32_epoch__MIN","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_32_epoch__MAX","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_4_epoch","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_4_epoch__MIN","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_4_epoch__MAX","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_512_epoch","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_512_epoch__MIN","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_512_epoch__MAX","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_64_epoch","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_64_epoch__MIN","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_64_epoch__MAX","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_8_epoch","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_8_epoch__MIN","tag_itr_attention_head_12_dim_384_bs_64_weight_decay_0.01_lr_0.0005_use_compile_True_train_sudoku-extreme_test_sudoku-extreme_num_layers_1_num_rep_attn_4_use_mpc_False_use_transformer_False - test_board_acc_32_8_epoch__MAX"
"0","2703.5","83","13283","0.9100550413131714","0.9100550413131714","0.9100550413131714","0.8157320618629456","0.8157320618629456","0.8157320618629456","0.6323061585426331","0.6323061585426331","0.6323061585426331","0.9332816004753113","0.9332816004753113","0.9332816004753113","0.6851382851600647","0.6851382851600647","0.6851382851600647","0.851908266544342","0.851908266544342","0.851908266544342","0.7331619262695312","0.7331619262695312","0.7331619262695312","0.9522294402122498","0.9522294402122498","0.9522294402122498","0.883446216583252","0.883446216583252","0.883446216583252","0.7760530114173889","0.7760530114173889","0.7760530114173889"