,name,seed_everything,test_prompt_length,max_pred_length,lr,adversarial_training,max_length,batch_size,model,dim_model,num_heads,dim_feedforward,num_decoder_layers,dropout_p,layer_norm_eps,lstm_embedding_dim,lstm_hidden_dim,lstm_num_layers,lstm_dropout,linear_embedding_dim,linear_bias,linear_dim,mamba_d_model,mamba_d_state,mamba_d_conv,mamba_n_layers,min_train_loss,min_train_loss_step,max_val_accuracy,max_val_accuracy_step,min_val_loss,min_val_loss_step,min_val_kl,min_val_kl_step,rule_1_accuracy4min_val_loss,rule_2_accuracy4min_val_loss,grammatical_accuracy4min_val_loss,finished4min_val_loss,ood_rule_1_accuracy4min_val_loss,ood_rule_2_completion_accuracy4min_val_loss,ood_rule_2_accuracy4min_val_loss,ood_grammatical_accuracy4min_val_loss,ood_finished4min_val_loss,sos_rule_1_accuracy4min_val_loss,sos_rule_2_accuracy4min_val_loss,sos_grammatical_accuracy4min_val_loss,sos_finished4min_val_loss
0,peach-sweep-11,12678,8,300,0.002,False,256,128,lstm,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.16843874752521515,286,0.8652495741844177,0,0.27762389183044434,0,0.23971739411354065,0,1.0,1.0,1.0,0.1875,1.0,1.0,0,0,0.265625,0,0,0,0
1,gallant-sweep-10,8021,8,300,0.002,False,256,128,lstm,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.15897980332374573,495,0.8677499294281006,0,0.27854233980178833,0,0.24063585698604584,0,0.7058823704719543,1.0,0.7058823704719543,0.6484375,0.800000011920929,0.9117646813392639,0,0,0.7109375,0,0,0,0
2,distinctive-sweep-9,38671,8,300,0.002,False,256,128,lstm,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.1817207783460617,416,0.8613812923431396,0,0.28550058603286743,0,0.24759408831596375,0,1.0,1.0,1.0,0.1796875,0.75,0.8333333730697632,0,0,0.3203125,0,0,0,0
3,trim-sweep-8,12257,8,300,0.002,False,256,128,lstm,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.1891881823539734,275,0.8711470365524292,0,0.26693084836006165,0,0.22902435064315796,0,1.0,1.0,1.0,0.484375,1.0,1.0,0,0,0.765625,1,1,1,1
4,fast-sweep-6,97222,8,300,0.002,False,256,128,lstm,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.18596035242080688,294,0.8647783994674683,0,0.28000304102897644,0,0.24209655821323395,0,0.800000011920929,1.0,0.800000011920929,0.3359375,0.6666666865348816,0.6666666865348816,0,0,0.4375,0,0,0,0
5,denim-sweep-7,81824,8,300,0.002,False,256,128,lstm,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.1819263994693756,209,0.8747188448905945,0,0.26734596490859985,0,0.22943949699401855,0,0.875,1.0,0.875,0.7265625,1.0,1.0,0,0,0.78125,0,0,0,0
6,faithful-sweep-3,91054,8,300,0.002,False,256,128,lstm,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.19107691943645477,455,0.8725149035453796,6,0.2658359408378601,0,0.22792945802211761,0,1.0,1.0,1.0,0.3984375,0.8666667342185974,1.0,0,0,0.4375,0,0,0,0
7,polar-sweep-2,11376,8,300,0.002,False,256,128,lstm,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.1801009178161621,338,0.8734116554260254,0,0.27058476209640503,0,0.23267829418182373,0,1.0,1.0,1.0,0.3828125,1.0,1.0,0,0,0.78125,0,0,0,0
8,hardy-sweep-4,61179,8,300,0.002,False,256,128,lstm,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.18696457147598267,321,0.866161584854126,0,0.27563661336898804,0,0.23773016035556793,0,0.8000000715255737,1.0,0.8000000715255737,0.3125,0.6829267740249634,1.0,0,0,0.546875,0,0,0,0
9,dazzling-sweep-5,37492,8,300,0.002,False,256,128,lstm,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.1637304723262787,419,0.8625592589378357,0,0.2878602147102356,3,0.2499537169933319,3,1.0,1.0,1.0,0.4765625,0.7142857313156128,1.0,0,0,0.5390625,1,1,1,1
10,fine-sweep-1,28398,8,300,0.002,False,256,128,lstm,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.1994350254535675,251,0.8648011684417725,0,0.2796596884727478,1,0.2417532205581665,1,1.0,1.0,1.0,0.453125,1.0,1.0,0,0,0.625,0,0,0,0
