{
    "dataset": "microsoft",
    "algorithm": "ft_transformer",
    "config": {
        "data": {
            "normalization": "quantile",
            "path": "data/microsoft",
            "y_policy": "mean_std"
        },
        "model": {
            "activation": "reglu",
            "attention_dropout": 0.2,
            "d_ffn_factor": 1.333333333333333,
            "d_token": 192,
            "ffn_dropout": 0.1,
            "initialization": "kaiming",
            "n_heads": 8,
            "n_layers": 3,
            "prenormalization": true,
            "residual_dropout": 0.0
        },
        "seed": 4,
        "training": {
            "batch_size": 1024,
            "eval_batch_size": 8192,
            "lr": 0.0001,
            "lr_n_decays": 0,
            "n_epochs": 1000000000,
            "optimizer": "adamw",
            "patience": 16,
            "weight_decay": 1e-05
        }
    },
    "environment": {
        "devices": {
            "CUDA_VISIBLE_DEVICES": "0,1",
            "torch.version.cuda": "10.1",
            "torch.backends.cudnn.version()": 7603,
            "torch.cuda.nccl.version()": 2708,
            "driver": "450.80.02",
            "0": {
                "name": "Tesla V100-PCIE-32GB",
                "total_memory": 34089730048
            },
            "1": {
                "name": "Tesla V100-PCIE-32GB",
                "total_memory": 34089730048
            }
        }
    },
    "epoch_size": 707,
    "n_parameters": 942331,
    "best_epoch": 14,
    "metrics": {
        "train": {
            "rmse": 0.721472631753193,
            "score": -0.721472631753193
        },
        "val": {
            "rmse": 0.7439889580674625,
            "score": -0.7439889580674625
        },
        "test": {
            "rmse": 0.7468085474093942,
            "score": -0.7468085474093942
        }
    },
    "time": "0:41:17"
}
