{
    "activation": "relu",
    "attention_dropout": 0.07290552721482114,
    "batch_size": 512,
    "d_token": 56,
    "data_loader_nprocs": 4,
    "data_path": "./datasets",
    "data_set": "higgs_embedded",
    "encoder_type": "linear_per_feature",
    "eta_min": 0,
    "exp_cache_cadence": 20,
    "exp_cadence_type": "improvement",
    "exp_device": null,
    "exp_n_runs": 1,
    "exp_patience": 16,
    "exp_scheduler": true,
    "exp_train_total_epochs": 200,
    "exp_warmup": 0,
    "exp_weight_decay_scheduler": true,
    "final_lr": 0,
    "final_weight_decay": 0,
    "full_dataset_cuda": false,
    "gradient_clipping": 1,
    "initialization": "kaiming",
    "ipe_scale": 1,
    "load_from_checkpoint": false,
    "load_path": null,
    "log_tensorboard": false,
    "lr": 0.00065080325132651,
    "mock": false,
    "model_amp": false,
    "model_dtype": "float32",
    "model_name": "autoint",
    "mp_distributed": false,
    "mp_gpus": 1,
    "mp_nodes": 1,
    "mp_nr": 0,
    "n_heads": 2,
    "n_layers": 7,
    "np_seed": 42,
    "output_file": "output.json",
    "pin_memory": true,
    "random_state": 42,
    "res_dir": "./",
    "residual_dropout": 0.043141062383989105,
    "start_lr": 0,
    "T_max": 10,
    "test": false,
    "test_size_ratio": 0.1,
    "torch_seed": 42,
    "using_embedding": true,
    "val_size_ratio": 0.1,
    "verbose": false,
    "weight_decay": 0.00005395155177026821,
    "script_path": "run_benchmark.py",
    "random": true
}