{
    "activation": "relu",
    "attention_dropout": 0.005515988545365018,
    "batch_size": 512,
    "d_token": 252,
    "data_loader_nprocs": 4,
    "data_path": "./datasets",
    "data_set": "mnist_embedded",
    "encoder_type": "linear_flatten",
    "eta_min": 0,
    "exp_cache_cadence": 20,
    "exp_cadence_type": "improvement",
    "exp_patience": 16,
    "exp_train_total_epochs": 200,
    "exp_warmup": 0,
    "final_lr": 0,
    "final_weight_decay": 0,
    "initialization": "kaiming",
    "lr": 0.000583189482623248,
    "model_name": "autoint",
    "n_heads": 2,
    "n_layers": 2,
    "residual_dropout": 0.09140924109423593,
    "start_lr": 0,
    "test_size_ratio": 0.1,
    "using_embedding": true,
    "val_size_ratio": 0.1,
    "weight_decay": 5.1072854745562606e-05,
    "script_path": "run_benchmark.py",
    "random": true
}