,name,seed_everything,test_prompt_length,max_pred_length,lr,adversarial_training,max_length,batch_size,model,dim_model,num_heads,dim_feedforward,num_decoder_layers,dropout_p,layer_norm_eps,lstm_embedding_dim,lstm_hidden_dim,lstm_num_layers,lstm_dropout,linear_embedding_dim,linear_bias,linear_dim,mamba_d_model,mamba_d_state,mamba_d_conv,mamba_n_layers,min_train_loss,min_train_loss_step,max_val_accuracy,max_val_accuracy_step,min_val_loss,min_val_loss_step,min_val_kl,min_val_kl_step,rule_1_accuracy4min_val_loss,rule_2_accuracy4min_val_loss,grammatical_accuracy4min_val_loss,finished4min_val_loss,ood_rule_1_accuracy4min_val_loss,ood_rule_2_completion_accuracy4min_val_loss,ood_rule_2_accuracy4min_val_loss,ood_grammatical_accuracy4min_val_loss,ood_finished4min_val_loss,sos_rule_1_accuracy4min_val_loss,sos_rule_2_accuracy4min_val_loss,sos_grammatical_accuracy4min_val_loss,sos_finished4min_val_loss
0,sleek-sweep-3,22226,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,1.4177917173618937e-10,303,0.505585789680481,0,5.067790985107422,0,-0.03790648281574249,10,0.375,1,0.375,1,0.59375,0,0,0,1,1,0,0,1
1,eager-sweep-4,45064,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,2.2819268696849804e-10,226,0.4964205324649811,15,5.014878749847412,0,-0.0379064716398716,23,0.4140625,1,0.4140625,1,0.4453125,0,0,0,1,1,0,0,1
2,lucky-sweep-5,19742,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,3.581794236207081e-11,453,0.49892082810401917,10,4.919543266296387,0,-0.037906479090452194,21,0.421875,1,0.421875,1,0.5703125,0,0,0,1,1,0,0,1
3,chocolate-sweep-6,59554,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,2.088676592792993e-10,258,0.5096592307090759,0,4.89928674697876,0,-0.03790643811225891,12,0.421875,1,0.421875,1,0.546875,0,0,0,1,1,0,0,1
4,logical-sweep-2,92433,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,2.2791954434886463e-10,456,0.4934566617012024,17,5.147296905517578,6,-0.037906449288129807,10,0.4375,1,0.4375,1,0.515625,0,0,0,1,1,0,0,1
