,name,seed_everything,test_prompt_length,max_pred_length,lr,adversarial_training,max_length,batch_size,model,dim_model,num_heads,dim_feedforward,num_decoder_layers,dropout_p,layer_norm_eps,lstm_embedding_dim,lstm_hidden_dim,lstm_num_layers,lstm_dropout,linear_embedding_dim,linear_bias,linear_dim,mamba_d_model,mamba_d_state,mamba_d_conv,mamba_n_layers,min_train_loss,min_train_loss_step,max_val_accuracy,max_val_accuracy_step,min_val_loss,min_val_loss_step,min_val_kl,min_val_kl_step,rule_1_accuracy4min_val_loss,rule_2_accuracy4min_val_loss,grammatical_accuracy4min_val_loss,finished4min_val_loss,ood_rule_1_accuracy4min_val_loss,ood_rule_2_completion_accuracy4min_val_loss,ood_rule_2_accuracy4min_val_loss,ood_grammatical_accuracy4min_val_loss,ood_finished4min_val_loss,sos_rule_1_accuracy4min_val_loss,sos_rule_2_accuracy4min_val_loss,sos_grammatical_accuracy4min_val_loss,sos_finished4min_val_loss
0,iconic-sweep-5,74552,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,3.615689345148887e-11,18,0.5171905755996704,0,4.686491966247559,6,-0.03790648654103279,1,0.5,1,0.5,1,0.5,0,0,0,1,1,0,0,1
1,pretty-sweep-3,78926,8,300,0.002,False,256,128,linear,10,5,1024,7,0.1,0.006,10,64,5,0.4,10,True,256,32,16,8,10,7.417664572850757e-12,20,0.5198656320571899,0,4.489923000335693,7,-0.03790648654103279,1,0.5,1,0.5,1,0.5,0,0,0,1,1,0,0,1
