{
    "attention_dropout": 0.3333567625094862,
    "attention_n_heads": 4,
    "batch_size": 512,
    "d_block": 128,
    "data_loader_nprocs": 4,
    "data_path": "./datasets",
    "data_set": "higgs_embedded",
    "encoder_type": "linear_flatten",
    "eta_min": 0,
    "exp_cache_cadence": 20,
    "exp_cadence_type": "improvement",
    "exp_device": null,
    "exp_final_lr": 0,
    "exp_n_runs": 1,
    "exp_patience": 16,
    "exp_scheduler": true,
    "exp_train_total_epochs": 200,
    "exp_warmup": 10,
    "exp_weight_decay_scheduler": true,
    "ffn_d_hidden": 64,
    "ffn_dropout": 0.48127559448918134,
    "final_lr": 0.001,
    "final_weight_decay": 0,
    "full_dataset_cuda": false,
    "gradient_clipping": 1,
    "ipe_scale": 1,
    "load_from_checkpoint": false,
    "load_path": null,
    "log_tensorboard": false,
    "lr": 0.0002251077661208916,
    "mock": false,
    "model_amp": false,
    "model_dtype": "float32",
    "model_name": "fttransformer",
    "mp_distributed": false,
    "mp_gpus": 1,
    "mp_nodes": 1,
    "mp_nr": 0,
    "n_blocks": 12,
    "np_seed": 42,
    "output_file": "output.json",
    "pin_memory": true,
    "random_state": 42,
    "res_dir": "./",
    "residual_dropout": 0.14651019023596132,
    "start_lr": 0,
    "T_max": 10,
    "test": false,
    "test_size_ratio": 0.1,
    "torch_seed": 42,
    "using_embedding": true,
    "val_size_ratio": 0.1,
    "verbose": false,
    "weight_decay": 0.00006937410902927194,
    "script_path": "run_benchmark.py",
    "random": true
}