,name,seed_everything,test_prompt_length,max_pred_length,lr,adversarial_training,max_length,batch_size,model,dim_model,num_heads,dim_feedforward,num_decoder_layers,dropout_p,layer_norm_eps,lstm_embedding_dim,lstm_hidden_dim,lstm_num_layers,lstm_dropout,linear_embedding_dim,linear_bias,linear_dim,mamba_d_model,mamba_d_state,mamba_d_conv,mamba_n_layers,min_train_loss,min_train_loss_step,max_val_accuracy,max_val_accuracy_step,min_val_loss,min_val_loss_step,min_val_kl,min_val_kl_step,rule_1_accuracy4min_val_loss,rule_2_accuracy4min_val_loss,grammatical_accuracy4min_val_loss,finished4min_val_loss,ood_rule_1_accuracy4min_val_loss,ood_rule_2_completion_accuracy4min_val_loss,ood_rule_2_accuracy4min_val_loss,ood_grammatical_accuracy4min_val_loss,ood_finished4min_val_loss,sos_rule_1_accuracy4min_val_loss,sos_rule_2_accuracy4min_val_loss,sos_grammatical_accuracy4min_val_loss,sos_finished4min_val_loss
0,classic-sweep-11,75227,8,300,0.002,False,256,128,transformer,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.03770262002944946,339,0.9923851490020752,14,0.03925536200404167,11,0.0013488754630088806,11,0.5234375,1,0.5234375,1.0,0.5625,0,0,0,1.0,0.0,0,0.0,0.0
1,frosty-sweep-15,19587,8,300,0.002,False,256,128,transformer,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.037975966930389404,260,0.9924002885818481,0,0.03913416713476181,16,0.00122767873108387,16,0.4296875,1,0.4296875,1.0,0.328125,0,0,0,1.0,0.0,0,0.0,0.0
2,light-sweep-12,8678,8,300,0.002,False,256,128,transformer,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.03807671740651131,433,0.9924079179763794,9,0.03944062069058418,15,0.001534133218228817,15,0.8046875,1,0.8046875,1.0,0.6171875,0,0,0,1.0,0.0,0,0.0,0.0
3,ancient-sweep-14,77800,8,300,0.002,False,256,128,transformer,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.038124531507492065,338,0.9923394918441772,0,0.039328157901763916,7,0.0014216722920536995,7,0.0,0,0.0,0.0,0.0,0,0,0,0.0,0.0,0,0.0,0.0
4,confused-sweep-13,72273,8,300,0.002,False,256,128,transformer,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.038290031254291534,398,0.9923698902130127,0,0.03920109570026398,11,0.0012946110218763351,11,0.0,0,0.0,0.0,0.0,0,0,0,0.0,0.0,0,0.0,0.0
5,cerulean-sweep-5,155,8,300,0.002,False,256,128,transformer,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.03793204575777054,408,0.9923622608184814,0,0.039580509066581726,11,0.0016740262508392334,11,0.703125,1,0.703125,1.0,0.578125,0,0,0,1.0,0.0,0,0.0,0.0
6,silver-sweep-7,71189,8,300,0.002,False,256,128,transformer,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.03791540116071701,258,0.9923850893974304,20,0.03939199820160866,5,0.0014855125918984413,5,0.6796875,1,0.6796875,1.0,0.8046875,0,0,0,1.0,0.0,1,0.0,0.0390625
7,deft-sweep-2,92085,8,300,0.002,False,256,128,transformer,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.03802008554339409,305,0.9924078583717346,0,0.039073020219802856,17,0.001166531816124916,17,0.609375,1,0.609375,1.0,0.65625,0,0,0,1.0,0.0,0,0.0,0.0
8,silver-sweep-3,666,8,300,0.002,False,256,128,transformer,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.0383472815155983,361,0.9923926591873169,0,0.03930718079209328,16,0.001400696113705635,16,0.2083333283662796,1,0.2083333283662796,0.5625,0.7549020051956177,0,0,0,0.796875,0.0,0,0.0,0.0
9,sweet-sweep-9,66258,8,300,0.002,False,256,128,transformer,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.03834685683250427,408,0.9923850297927856,9,0.03931829333305359,6,0.0014118067920207977,6,0.5625,1,0.5625,1.0,0.53125,0,0,0,1.0,1.0,1,1.0,1.0
10,young-sweep-4,12480,8,300,0.002,False,256,128,transformer,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.038311272859573364,233,0.9923850893974304,0,0.03941444680094719,7,0.0015079621225595474,7,0.0,0,0.0,0.0,0.0,0,0,0,0.0,0.0,0,0.0,0.0
11,unique-sweep-8,17470,8,300,0.002,False,256,128,transformer,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.038265883922576904,382,0.9924306869506836,0,0.039003416895866394,17,0.001096930354833603,17,0.0,0,0.0,0.0,0.0,0,0,0,0.0,0.0,0,0.0,0.0
12,desert-sweep-1,46926,8,300,0.002,False,256,128,transformer,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.03827069327235222,268,0.9923850297927856,0,0.038957685232162476,14,0.0010511986911296844,14,0.6015625,1,0.6015625,1.0,0.5703125,0,0,0,1.0,0.0,0,0.0,0.0
13,soft-sweep-6,41776,8,300,0.002,False,256,128,transformer,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,0.03820550814270973,191,0.992331862449646,0,0.039206892251968384,11,0.001300404779613018,11,0.0,0,0.0,0.0,0.0,0,0,0,0.0,0.0,0,0.0,0.0
