{
    "config": {
        "base_config": {
            "data": {
                "normalization": "quantile",
                "path": "data/microsoft",
                "y_policy": "mean_std"
            },
            "model": {
                "activation": "reglu",
                "d_ffn_factor": 1.333333333333333,
                "initialization": "kaiming",
                "n_heads": 8,
                "prenormalization": true,
                "residual_dropout": 0.0,
                "token_bias": false,
                "token_cat_bias": false
            },
            "seed": 0,
            "training": {
                "batch_size": 1024,
                "eval_batch_size": 8192,
                "n_epochs": 1000000000,
                "optimizer": "adamw",
                "patience": 16
            }
        },
        "optimization": {
            "options": {
                "n_trials": 50
            },
            "sampler": {
                "seed": 0
            },
            "space": {
                "model": {
                    "attention_dropout": [
                        "uniform",
                        0.0,
                        0.5
                    ],
                    "d_token": [
                        "$d_token",
                        64,
                        512
                    ],
                    "ffn_dropout": [
                        "uniform",
                        0.0,
                        0.5
                    ],
                    "n_layers": [
                        "int",
                        1,
                        6
                    ]
                },
                "training": {
                    "lr": [
                        "loguniform",
                        3e-05,
                        0.0003
                    ],
                    "weight_decay": [
                        "loguniform",
                        1e-06,
                        0.001
                    ]
                }
            }
        },
        "program": "bin/ft_transformer.py"
    },
    "environment": {
        "devices": {
            "CUDA_VISIBLE_DEVICES": "0,1,2",
            "torch.version.cuda": "10.1",
            "torch.backends.cudnn.version()": 7603,
            "torch.cuda.nccl.version()": 2708,
            "driver": "450.80.02",
            "0": {
                "name": "Tesla V100-PCIE-32GB",
                "total_memory": 34089730048
            },
            "1": {
                "name": "Tesla V100-PCIE-32GB",
                "total_memory": 34089730048
            },
            "2": {
                "name": "Tesla V100-PCIE-32GB",
                "total_memory": 34089730048
            }
        }
    },
    "continuations": [
        4,
        23
    ],
    "best_stats": {
        "dataset": "microsoft",
        "algorithm": "ft_transformer",
        "config": {
            "data": {
                "normalization": "quantile",
                "path": "data/microsoft",
                "y_policy": "mean_std"
            },
            "model": {
                "activation": "reglu",
                "attention_dropout": 0.1558926086578752,
                "d_ffn_factor": 1.333333333333333,
                "d_token": 192,
                "ffn_dropout": 0.1400961316024743,
                "initialization": "kaiming",
                "n_heads": 8,
                "n_layers": 5,
                "prenormalization": true,
                "residual_dropout": 0.0,
                "token_bias": false,
                "token_cat_bias": false
            },
            "seed": 0,
            "training": {
                "batch_size": 1024,
                "eval_batch_size": 8192,
                "lr": 0.0001688316076012206,
                "n_epochs": 1000000000,
                "optimizer": "adamw",
                "patience": 16,
                "weight_decay": 0.0006582641175048847
            }
        },
        "environment": {
            "devices": {
                "CUDA_VISIBLE_DEVICES": "0,1,2",
                "torch.version.cuda": "10.1",
                "torch.backends.cudnn.version()": 7603,
                "torch.cuda.nccl.version()": 2708,
                "driver": "450.80.02",
                "0": {
                    "name": "Tesla V100-PCIE-32GB",
                    "total_memory": 34089730048
                },
                "1": {
                    "name": "Tesla V100-PCIE-32GB",
                    "total_memory": 34089730048
                },
                "2": {
                    "name": "Tesla V100-PCIE-32GB",
                    "total_memory": 34089730048
                }
            }
        },
        "epoch_size": 707,
        "n_parameters": 1509367,
        "best_epoch": 16,
        "metrics": {
            "train": {
                "rmse": 0.7180501799268438,
                "score": -0.7180501799268438
            },
            "val": {
                "rmse": 0.7461653578185747,
                "score": -0.7461653578185747
            },
            "test": {
                "rmse": 0.7501609668926527,
                "score": -0.7501609668926527
            }
        },
        "time": "0:56:44",
        "trial_id": 36,
        "tuning_time": "1 day, 18:29:52"
    },
    "time": "2 days, 12:21:11"
}
