{
    "config": {
        "base_config": {
            "data": {
                "normalization": "quantile",
                "path": "data/california_housing",
                "y_policy": "mean_std"
            },
            "model": {
                "activation": "reglu",
                "initialization": "kaiming",
                "n_heads": 8,
                "prenormalization": false
            },
            "seed": 0,
            "training": {
                "batch_size": 256,
                "eval_batch_size": 8192,
                "n_epochs": 1000000000,
                "optimizer": "adamw",
                "patience": 16
            }
        },
        "optimization": {
            "options": {
                "n_trials": 100
            },
            "sampler": {
                "seed": 0
            },
            "space": {
                "model": {
                    "attention_dropout": [
                        "uniform",
                        0.0,
                        0.5
                    ],
                    "d_ffn_factor": [
                        "$d_ffn_factor",
                        1.0,
                        4.0
                    ],
                    "d_token": [
                        "$d_token",
                        64,
                        512
                    ],
                    "ffn_dropout": [
                        "uniform",
                        0.0,
                        0.5
                    ],
                    "n_layers": [
                        "int",
                        1,
                        4
                    ],
                    "residual_dropout": [
                        "?uniform",
                        0.0,
                        0.0,
                        0.2
                    ]
                },
                "training": {
                    "lr": [
                        "loguniform",
                        1e-05,
                        0.001
                    ],
                    "weight_decay": [
                        "loguniform",
                        1e-06,
                        0.001
                    ]
                }
            }
        },
        "program": "bin/ft_transformer.py"
    },
    "environment": {
        "devices": {
            "CUDA_VISIBLE_DEVICES": "1",
            "torch.version.cuda": "10.1",
            "torch.backends.cudnn.version()": 7603,
            "torch.cuda.nccl.version()": 2708,
            "driver": "440.33.01",
            "1": {
                "name": "GeForce RTX 2080 Ti",
                "total_memory": 11552096256
            }
        }
    },
    "best_stats": {
        "dataset": "california_housing",
        "algorithm": "ft_transformer",
        "config": {
            "data": {
                "normalization": "quantile",
                "path": "data/california_housing",
                "y_policy": "mean_std"
            },
            "model": {
                "activation": "reglu",
                "attention_dropout": 0.4518858598707761,
                "d_ffn_factor": 2.342425545888827,
                "d_token": 272,
                "ffn_dropout": 0.1462394754853018,
                "initialization": "kaiming",
                "n_heads": 8,
                "n_latent_tokens": 1,
                "n_layers": 3,
                "prenormalization": false,
                "residual_dropout": 0.0
            },
            "seed": 0,
            "training": {
                "batch_size": 256,
                "eval_batch_size": 8192,
                "lr": 9.230462560646988e-05,
                "n_epochs": 1000000000,
                "optimizer": "adamw",
                "patience": 16,
                "weight_decay": 2.242573649081314e-06
            }
        },
        "environment": {
            "devices": {
                "CUDA_VISIBLE_DEVICES": "1",
                "torch.version.cuda": "10.1",
                "torch.backends.cudnn.version()": 7603,
                "torch.cuda.nccl.version()": 2708,
                "driver": "440.33.01",
                "1": {
                    "name": "GeForce RTX 2080 Ti",
                    "total_memory": 11552096256
                }
            }
        },
        "epoch_size": 52,
        "n_parameters": 2463247,
        "best_epoch": 130,
        "metrics": {
            "train": {
                "rmse": 0.34729638013411923,
                "score": -0.34729638013411923
            },
            "val": {
                "rmse": 0.45779941414854475,
                "score": -0.45779941414854475
            },
            "test": {
                "rmse": 0.46096206007326207,
                "score": -0.46096206007326207
            }
        },
        "time": "0:01:40",
        "trial_id": 22
    },
    "time": "2:39:48"
}