{
    "val_metrics": [
        {
            "mnist_val_loss": 0.12449716031551361,
            "lr": 5.392560706241056e-05,
            "mnist_val_accuracy": 0.9675714373588562,
            "mnist_val_precision": 0.9683455228805542,
            "mnist_val_recall": 0.9675714373588562,
            "mnist_val_f1-score": 0.9675799608230591,
            "mnist_val_support": 503.7439880371094,
            "mnist_val_score": 0.9675714373588562
        }
    ],
    "test_metrics": [
        {
            "mnist_test_loss": 0.11310623586177826,
            "lr": 5.392560706241056e-05,
            "mnist_test_accuracy": 0.9700000286102295,
            "mnist_test_precision": 0.9705820083618164,
            "mnist_test_recall": 0.9700000286102295,
            "mnist_test_f1-score": 0.9700143933296204,
            "mnist_test_support": 503.7439880371094,
            "mnist_test_score": 0.9700000286102295
        }
    ],
    "args": {
        "test": false,
        "mock": false,
        "res_dir": "./",
        "data_path": "./datasets",
        "data_set": "mnist",
        "test_size_ratio": 0.1,
        "val_size_ratio": 0.1,
        "random_state": 7348,
        "full_dataset_cuda": false,
        "verbose": false,
        "exp_n_runs": 1,
        "exp_device": null,
        "np_seed": 38217,
        "torch_seed": 52963,
        "random": true,
        "output_file": "ft_transformer_mnist_tuned/output_16.json",
        "batch_size": 512,
        "exp_train_total_epochs": 200,
        "exp_patience": 16,
        "log_tensorboard": false,
        "exp_cadence_type": "improvement",
        "exp_cache_cadence": 20,
        "exp_scheduler": true,
        "exp_weight_decay_scheduler": true,
        "start_lr": 0.0,
        "lr": 7.968468205343073e-05,
        "final_lr": 0.001,
        "T_max": 10,
        "eta_min": 0.0,
        "exp_warmup": 10,
        "weight_decay": 5.472572212295389e-07,
        "final_weight_decay": 0.0,
        "ipe_scale": 1.0,
        "gradient_clipping": 1.0,
        "mp_distributed": false,
        "mp_nodes": 1,
        "mp_gpus": 1,
        "mp_nr": 0,
        "pin_memory": true,
        "using_embedding": true,
        "model_name": "fttransformer",
        "model_dtype": "float32",
        "data_loader_nprocs": 4,
        "load_from_checkpoint": false,
        "load_path": null,
        "model_amp": false,
        "task_type": "multi_class",
        "is_batchlearning": true,
        "iteration": 0,
        "encoder_type": "linear_flatten",
        "d_out": 128,
        "n_blocks": 8,
        "d_block": 32,
        "attention_n_heads": 8,
        "attention_dropout": 0.4259193079814802,
        "ffn_d_hidden": 256,
        "ffn_d_hidden_multiplier": null,
        "ffn_dropout": 0.010527318594966806,
        "residual_dropout": 0.10878389352934607,
        "input_embed_dim": 28,
        "input_dim": 28,
        "out_dim": 10,
        "summary_input": [
            512,
            28,
            28
        ],
        "dataset_name": "mnist",
        "iterations_per_epoch": 110,
        "num_epochs": 200,
        "cardinalities": [],
        "n_cont_features": 28
    },
    "profiling_info": [
        {
            "function": "warnings.py:503(__exit__)",
            "call_count": 187920,
            "total_time": 0.19898694500000003,
            "cumulative_time": 0.238236086
        },
        {
            "function": "_parser.py:86(opengroup)",
            "call_count": 1,
            "total_time": 5.772e-06,
            "cumulative_time": 8.182e-06
        },
        {
            "function": "_parser.py:953(fix_flags)",
            "call_count": 1,
            "total_time": 1.557e-06,
            "cumulative_time": 1.8030000000000001e-06
        },
        {
            "function": "_parser.py:240(__next)",
            "call_count": 11,
            "total_time": 9.097000000000001e-06,
            "cumulative_time": 9.097000000000001e-06
        },
        {
            "function": "__init__.py:179(sub)",
            "call_count": 2,
            "total_time": 3.949000000000001e-06,
            "cumulative_time": 1.9347e-05
        },
        {
            "function": "__init__.py:199(split)",
            "call_count": 38,
            "total_time": 0.000159457,
            "cumulative_time": 0.0006837750000000001
        },
        {
            "function": "__init__.py:209(findall)",
            "call_count": 884,
            "total_time": 0.004893801000000001,
            "cumulative_time": 0.023080171
        },
        {
            "function": "enum.py:807(<genexpr>)",
            "call_count": 25410,
            "total_time": 0.021277476,
            "cumulative_time": 0.021277476
        },
        {
            "function": "pathlib.py:484(_str_normcase)",
            "call_count": 74,
            "total_time": 0.000960509,
            "cumulative_time": 0.002188803
        },
        {
            "function": "warnings.py:20(_showwarnmsg_impl)",
            "call_count": 2,
            "total_time": 1.1138e-05,
            "cumulative_time": 0.0007411360000000001
        }
    ],
    "total_elapsed_time": 464.93888315400034
}