{
    "dataset": "microsoft-OpenFE-10",
    "algorithm": "ft_transformer",
    "config": {
        "data": {
            "normalization": "quantile",
            "path": "data/microsoft-OpenFE-10",
            "y_policy": "mean_std"
        },
        "model": {
            "activation": "reglu",
            "attention_dropout": 0.2367026970034473,
            "d_ffn_factor": 1.333333333333333,
            "d_token": 104,
            "ffn_dropout": 0.08782495176671656,
            "initialization": "kaiming",
            "n_heads": 8,
            "n_layers": 2,
            "prenormalization": true,
            "residual_dropout": 0.0
        },
        "seed": 0,
        "training": {
            "batch_size": 1024,
            "eval_batch_size": 8192,
            "lr": 4.69162138270869e-05,
            "n_epochs": 1000000000,
            "optimizer": "adamw",
            "patience": 16,
            "weight_decay": 0.0009997786518737089
        }
    },
    "environment": {
        "devices": {
            "CUDA_VISIBLE_DEVICES": "0",
            "torch.version.cuda": "10.1",
            "torch.backends.cudnn.version()": 7603,
            "torch.cuda.nccl.version()": 2708,
            "driver": "455.32.00",
            "0": {
                "name": "Tesla V100-PCIE-16GB",
                "total_memory": 16945512448
            }
        }
    },
    "epoch_size": 707,
    "n_parameters": 205641,
    "eval_batch_size": 4096,
    "best_epoch": 62,
    "metrics": {
        "train": {
            "rmse": 0.714838803152565,
            "score": -0.714838803152565
        },
        "val": {
            "rmse": 0.7393260232245932,
            "score": -0.7393260232245932
        },
        "test": {
            "rmse": 0.7401550693067559,
            "score": -0.7401550693067559
        }
    },
    "time": "1:28:13"
}
