{
    "attention_dropout": 0.4259193079814802,
    "attention_n_heads": 8,
    "batch_size": 512,
    "d_block": 32,
    "data_loader_nprocs": 4,
    "data_path": "./datasets",
    "data_set": "mnist",
    "encoder_type": "linear_flatten",
    "exp_cache_cadence": 20,
    "exp_cadence_type": "improvement",
    "exp_final_lr": 0,
    "exp_patience": 16,
    "exp_train_total_epochs": 200,
    "exp_warmup": 10,
    "ffn_d_hidden": 256,
    "ffn_dropout": 0.010527318594966806,
    "final_weight_decay": 0,
    "lr": 7.968468205343073e-05,
    "model_name": "fttransformer",
    "n_blocks": 8,
    "residual_dropout": 0.10878389352934607,
    "start_lr": 0,
    "test_size_ratio": 0.1,
    "using_embedding": true,
    "val_size_ratio": 0.1,
    "weight_decay": 5.472572212295389e-07,
    "script_path": "run_benchmark.py",
    "random": true
}