{
    "dataset": "microsoft",
    "algorithm": "ft_transformer",
    "config": {
        "data": {
            "normalization": "quantile",
            "path": "data/microsoft",
            "y_policy": "mean_std"
        },
        "model": {
            "activation": "reglu",
            "attention_dropout": 0.2367026970034473,
            "d_ffn_factor": 1.333333333333333,
            "d_token": 104,
            "ffn_dropout": 0.08782495176671656,
            "initialization": "kaiming",
            "n_heads": 8,
            "n_layers": 2,
            "prenormalization": true,
            "residual_dropout": 0.0
        },
        "seed": 8,
        "training": {
            "batch_size": 1024,
            "eval_batch_size": 8192,
            "lr": 4.69162138270869e-05,
            "n_epochs": 1000000000,
            "optimizer": "adamw",
            "patience": 16,
            "weight_decay": 0.0009997786518737089
        }
    },
    "environment": {
        "devices": {
            "CUDA_VISIBLE_DEVICES": "0,1",
            "torch.version.cuda": "10.1",
            "torch.backends.cudnn.version()": 7603,
            "torch.cuda.nccl.version()": 2708,
            "driver": "450.80.02",
            "0": {
                "name": "Tesla V100-PCIE-32GB",
                "total_memory": 34089730048
            },
            "1": {
                "name": "Tesla V100-PCIE-32GB",
                "total_memory": 34089730048
            }
        }
    },
    "epoch_size": 707,
    "n_parameters": 203561,
    "best_epoch": 64,
    "metrics": {
        "train": {
            "rmse": 0.7200226260524589,
            "score": -0.7200226260524589
        },
        "val": {
            "rmse": 0.7430651150058897,
            "score": -0.7430651150058897
        },
        "test": {
            "rmse": 0.7457997750124894,
            "score": -0.7457997750124894
        }
    },
    "time": "0:43:13"
}
