{
    "ednet": [
        {
            "fold": 0,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.05,
            "loss2": 0.5,
            "final_fc_dim2": 64,
            "loss1": 0.5,
            "d_model": 64,
            "num_attn_heads": 8,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.001
        },
        {
            "fold": 4,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 64,
            "nheads": 4,
            "dropout": 0.05,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        },
        {
            "fold": 3,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.3,
            "loss2": 0.5,
            "final_fc_dim2": 64,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 8,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        },
        {
            "fold": 1,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.1,
            "loss2": 0.5,
            "final_fc_dim2": 64,
            "loss1": 0.5,
            "d_model": 64,
            "num_attn_heads": 8,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 64,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.001
        },
        {
            "fold": 2,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.1,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 8,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 64,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        }
    ],
    "nips_task34": [
        {
            "fold": 3,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.3,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 64,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.001
        },
        {
            "fold": 4,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.3,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 64,
            "num_attn_heads": 8,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.001
        },
        {
            "fold": 0,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.3,
            "loss2": 0.5,
            "final_fc_dim2": 64,
            "loss1": 0.5,
            "d_model": 64,
            "num_attn_heads": 8,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.001
        },
        {
            "fold": 1,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.3,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 64,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.001
        },
        {
            "fold": 2,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.3,
            "loss2": 0.5,
            "final_fc_dim2": 64,
            "loss1": 0.5,
            "d_model": 64,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.001
        }
    ],
    "statics2011": [
        {
            "fold": 1,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.5,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 42,
            "final_fc_dim": 256,
            "n_blocks": 2,
            "start": 50,
            "learning_rate": 0.001
        },
        {
            "fold": 0,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.3,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 8,
            "num_layers": 2,
            "seed": 42,
            "final_fc_dim": 256,
            "n_blocks": 2,
            "start": 50,
            "learning_rate": 0.001
        },
        {
            "fold": 4,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 64,
            "nheads": 4,
            "dropout": 0.5,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 8,
            "num_layers": 2,
            "seed": 42,
            "final_fc_dim": 256,
            "n_blocks": 1,
            "start": 50,
            "learning_rate": 0.001
        },
        {
            "fold": 3,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 64,
            "nheads": 4,
            "dropout": 0.5,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 8,
            "num_layers": 2,
            "seed": 42,
            "final_fc_dim": 256,
            "n_blocks": 1,
            "start": 50,
            "learning_rate": 0.001
        },
        {
            "fold": 2,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.3,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 42,
            "final_fc_dim": 256,
            "n_blocks": 2,
            "start": 50,
            "learning_rate": 0.001
        }
    ],
    "poj": [
        {
            "fold": 4,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 64,
            "nheads": 4,
            "dropout": 0.3,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 8,
            "num_layers": 2,
            "seed": 42,
            "final_fc_dim": 256,
            "n_blocks": 2,
            "start": 50,
            "learning_rate": 0.0001
        },
        {
            "fold": 1,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.5,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 64,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        },
        {
            "fold": 0,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 64,
            "nheads": 4,
            "dropout": 0.3,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        },
        {
            "fold": 3,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 64,
            "nheads": 4,
            "dropout": 0.3,
            "loss2": 0.5,
            "final_fc_dim2": 64,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 8,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 2,
            "start": 50,
            "learning_rate": 0.0001
        },
        {
            "fold": 2,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.5,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 64,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 42,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        }
    ],
    "algebra2005": [
        {
            "fold": 3,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.1,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 42,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        },
        {
            "fold": 1,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.05,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 42,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        },
        {
            "fold": 0,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.1,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 42,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        },
        {
            "fold": 2,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 64,
            "nheads": 4,
            "dropout": 0.1,
            "loss2": 0.5,
            "final_fc_dim2": 64,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        },
        {
            "fold": 4,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.1,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 1e-05
        }
    ],
    "assist2009": [
        {
            "fold": 4,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 64,
            "nheads": 4,
            "dropout": 0.1,
            "loss2": 0.5,
            "final_fc_dim2": 64,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 42,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        },
        {
            "fold": 0,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 64,
            "nheads": 4,
            "dropout": 0.1,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 42,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        },
        {
            "fold": 1,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.3,
            "loss2": 0.5,
            "final_fc_dim2": 64,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 42,
            "final_fc_dim": 64,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        },
        {
            "fold": 2,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.3,
            "loss2": 0.5,
            "final_fc_dim2": 64,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 42,
            "final_fc_dim": 64,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        },
        {
            "fold": 3,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.3,
            "loss2": 0.5,
            "final_fc_dim2": 64,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        }
    ],
    "bridge2algebra2006": [
        {
            "fold": 3,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.1,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 8,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        },
        {
            "fold": 0,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.1,
            "loss2": 0.5,
            "final_fc_dim2": 64,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 42,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 1e-05
        },
        {
            "fold": 4,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 64,
            "nheads": 4,
            "dropout": 0.1,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 42,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 1e-05
        },
        {
            "fold": 1,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 64,
            "nheads": 4,
            "dropout": 0.1,
            "loss2": 0.5,
            "final_fc_dim2": 64,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 8,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        },
        {
            "fold": 2,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 64,
            "nheads": 4,
            "dropout": 0.1,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 8,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        }
    ],
    "assist2015": [
        {
            "fold": 4,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.1,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 8,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 1e-05
        },
        {
            "fold": 0,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.1,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 42,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 1e-05
        },
        {
            "fold": 2,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.05,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 4,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 1e-05
        },
        {
            "fold": 3,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.1,
            "loss2": 0.5,
            "final_fc_dim2": 256,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 8,
            "num_layers": 2,
            "seed": 3407,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        },
        {
            "fold": 1,
            "emb_type": "qid",
            "loss3": 0.5,
            "d_ff": 256,
            "nheads": 4,
            "dropout": 0.1,
            "loss2": 0.5,
            "final_fc_dim2": 64,
            "loss1": 0.5,
            "d_model": 256,
            "num_attn_heads": 8,
            "num_layers": 2,
            "seed": 42,
            "final_fc_dim": 256,
            "n_blocks": 4,
            "start": 50,
            "learning_rate": 0.0001
        }
    ]
}