,name,seed_everything,test_prompt_length,max_pred_length,lr,adversarial_training,max_length,batch_size,model,dim_model,num_heads,dim_feedforward,num_decoder_layers,dropout_p,layer_norm_eps,lstm_embedding_dim,lstm_hidden_dim,lstm_num_layers,lstm_dropout,linear_embedding_dim,linear_bias,linear_dim,mamba_d_model,mamba_d_state,mamba_d_conv,mamba_n_layers,min_train_loss,min_train_loss_step,max_val_accuracy,max_val_accuracy_step,min_val_loss,min_val_loss_step,min_val_kl,min_val_kl_step,rule_1_accuracy4min_val_loss,rule_2_accuracy4min_val_loss,grammatical_accuracy4min_val_loss,finished4min_val_loss,ood_rule_1_accuracy4min_val_loss,ood_rule_2_completion_accuracy4min_val_loss,ood_rule_2_accuracy4min_val_loss,ood_grammatical_accuracy4min_val_loss,ood_finished4min_val_loss,sos_rule_1_accuracy4min_val_loss,sos_rule_2_accuracy4min_val_loss,sos_grammatical_accuracy4min_val_loss,sos_finished4min_val_loss
0,mild-sweep-17,90889,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,8.996963515528478e-06,129,0.5096668004989624,1,2.491274356842041,0,-0.037897493690252304,25,0.20000000298023224,1,0.20000000298023224,1,0.2749004065990448,1,0.01593625545501709,0,1,1,1,1,1
1,generous-sweep-11,22678,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,1.0994385775120463e-05,129,0.505836546421051,1,2.7866599559783936,0,-0.03789549693465233,25,0.20000000298023224,1,0.20000000298023224,1,0.2749004065990448,1,0.01593625545501709,0,1,1,1,1,1
2,confused-sweep-15,93006,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,1.085731310013216e-05,129,0.5096971988677979,25,2.5019068717956543,0,-0.03789563477039337,25,0.20000000298023224,1,0.20000000298023224,1,0.2749004065990448,1,0.01593625545501709,0,1,1,1,1,1
3,desert-sweep-9,28056,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,1.0715491043811198e-05,129,0.5059581995010376,25,2.6423065662384033,0,-0.03789577633142471,25,0.20000000298023224,1,0.20000000298023224,1,0.2749004065990448,1,0.01593625545501709,0,1,1,1,1,1
4,polished-sweep-13,99030,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,1.1268013622611761e-05,129,0.505836546421051,1,2.567272663116455,0,-0.03789522498846054,25,0.20000000298023224,1,0.20000000298023224,1,0.2749004065990448,1,0.01593625545501709,0,1,1,1,1,1
5,giddy-sweep-8,95919,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,1.1308781722618733e-05,129,0.505836546421051,1,2.855391502380371,0,-0.03789518401026726,25,0.20000000298023224,1,0.20000000298023224,1,0.2749004065990448,1,0.01593625545501709,0,1,1,1,1,1
6,swept-sweep-6,71515,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,8.776529284659773e-06,129,0.5058669447898865,13,2.4007225036621094,0,-0.03789771348237991,25,0.20000000298023224,1,0.20000000298023224,1,0.2749004065990448,1,0.01593625545501709,0,1,1,1,1,1
7,astral-sweep-7,58154,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,1.109661752707325e-05,129,0.5135274529457092,21,2.3776373863220215,0,-0.03789539635181427,25,0.20000000298023224,1,0.20000000298023224,1,0.2749004065990448,1,0.01593625545501709,0,1,1,1,1,1
8,peach-sweep-5,90694,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,1.1573446499824058e-05,129,0.5058669447898865,16,2.700862169265747,0,-0.03789491951465607,25,0.20000000298023224,1,0.20000000298023224,1,0.2749004065990448,1,0.01593625545501709,0,1,1,1,1,1
9,effortless-sweep-2,77916,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,1.0535590263316408e-05,129,0.5172969102859497,22,2.4117789268493652,0,-0.03789595514535904,25,0.20000000298023224,1,0.20000000298023224,1,0.2749004065990448,1,0.01593625545501709,0,1,1,1,1,1
10,dark-sweep-3,22130,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,9.614831469662022e-06,129,0.5096971988677979,1,2.419177770614624,0,-0.03789687529206276,25,0.20000000298023224,1,0.20000000298023224,1,0.2749004065990448,1,0.01593625545501709,0,1,1,1,1,1
11,tough-sweep-4,903,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,1.1357969924574718e-05,129,0.5134970545768738,4,2.4826276302337646,0,-0.03789513558149338,25,0.20000000298023224,1,0.20000000298023224,1,0.2749004065990448,1,0.01593625545501709,0,1,1,1,1,1
