{
    "config": {
        "base_config": {
            "data": {
                "normalization": "quantile",
                "path": "data/jannis"
            },
            "model": {
                "activation": "reglu",
                "initialization": "kaiming",
                "n_heads": 8,
                "prenormalization": false
            },
            "seed": 0,
            "training": {
                "batch_size": 512,
                "eval_batch_size": 8192,
                "n_epochs": 1000000000,
                "optimizer": "adamw",
                "patience": 16
            }
        },
        "optimization": {
            "options": {
                "n_trials": 100
            },
            "sampler": {
                "seed": 0
            },
            "space": {
                "model": {
                    "attention_dropout": [
                        "uniform",
                        0.0,
                        0.5
                    ],
                    "d_ffn_factor": [
                        "$d_ffn_factor",
                        1.0,
                        4.0
                    ],
                    "d_token": [
                        "$d_token",
                        64,
                        512
                    ],
                    "ffn_dropout": [
                        "uniform",
                        0.0,
                        0.5
                    ],
                    "n_layers": [
                        "int",
                        1,
                        4
                    ],
                    "residual_dropout": [
                        "?uniform",
                        0.0,
                        0.0,
                        0.2
                    ]
                },
                "training": {
                    "lr": [
                        "loguniform",
                        1e-05,
                        0.001
                    ],
                    "weight_decay": [
                        "loguniform",
                        1e-06,
                        0.001
                    ]
                }
            }
        },
        "program": "bin/ft_transformer.py"
    },
    "environment": {
        "devices": {
            "CUDA_VISIBLE_DEVICES": "1",
            "torch.version.cuda": "10.1",
            "torch.backends.cudnn.version()": 7603,
            "torch.cuda.nccl.version()": 2708,
            "driver": "440.33.01",
            "1": {
                "name": "GeForce RTX 2080 Ti",
                "total_memory": 11552096256
            }
        }
    },
    "best_stats": {
        "dataset": "jannis",
        "algorithm": "ft_transformer",
        "config": {
            "data": {
                "normalization": "quantile",
                "path": "data/jannis"
            },
            "model": {
                "activation": "reglu",
                "attention_dropout": 0.4194914895568438,
                "d_ffn_factor": 1.061031416526688,
                "d_token": 288,
                "ffn_dropout": 0.4632881116664471,
                "initialization": "kaiming",
                "n_heads": 8,
                "n_latent_tokens": 1,
                "n_layers": 4,
                "prenormalization": false,
                "residual_dropout": 0.0
            },
            "seed": 0,
            "training": {
                "batch_size": 512,
                "eval_batch_size": 8192,
                "lr": 0.0001089430445312344,
                "n_epochs": 1000000000,
                "optimizer": "adamw",
                "patience": 16,
                "weight_decay": 2.897993930091118e-05
            }
        },
        "environment": {
            "devices": {
                "CUDA_VISIBLE_DEVICES": "1",
                "torch.version.cuda": "10.1",
                "torch.backends.cudnn.version()": 7603,
                "torch.cuda.nccl.version()": 2708,
                "driver": "440.33.01",
                "1": {
                    "name": "GeForce RTX 2080 Ti",
                    "total_memory": 11552096256
                }
            }
        },
        "epoch_size": 105,
        "n_parameters": 2426540,
        "best_epoch": 49,
        "metrics": {
            "train": {
                "0": {
                    "precision": 0.615909090909091,
                    "recall": 0.25092592592592594,
                    "f1-score": 0.35657894736842105,
                    "support": 1080
                },
                "1": {
                    "precision": 0.6899058811812161,
                    "recall": 0.7519131614654003,
                    "f1-score": 0.7195761699475407,
                    "support": 18425
                },
                "2": {
                    "precision": 0.7728077422400567,
                    "recall": 0.6943796394485684,
                    "f1-score": 0.7314975143830643,
                    "support": 9430
                },
                "3": {
                    "precision": 0.8437830365129706,
                    "recall": 0.8417636798766884,
                    "f1-score": 0.8427721485572724,
                    "support": 24653
                },
                "accuracy": 0.7730275434798836,
                "macro avg": {
                    "precision": 0.7306014377108336,
                    "recall": 0.6347456016791457,
                    "f1-score": 0.6626061950640746,
                    "support": 53588
                },
                "weighted avg": {
                    "precision": 0.7737937203744071,
                    "recall": 0.7730275434798836,
                    "f1-score": 0.7710341780521025,
                    "support": 53588
                },
                "score": 0.7730275434798836
            },
            "val": {
                "0": {
                    "precision": 0.4574468085106383,
                    "recall": 0.15925925925925927,
                    "f1-score": 0.23626373626373628,
                    "support": 270
                },
                "1": {
                    "precision": 0.6504147278980377,
                    "recall": 0.6978510961580204,
                    "f1-score": 0.6732984293193718,
                    "support": 4607
                },
                "2": {
                    "precision": 0.7305529522024368,
                    "recall": 0.6614340263046246,
                    "f1-score": 0.6942774437764418,
                    "support": 2357
                },
                "3": {
                    "precision": 0.8188533804400193,
                    "recall": 0.8272225827384815,
                    "f1-score": 0.8230167056734727,
                    "support": 6164
                },
                "accuracy": 0.7401104642483953,
                "macro avg": {
                    "precision": 0.664316967262783,
                    "recall": 0.5864417411150964,
                    "f1-score": 0.6067140787582557,
                    "support": 13398
                },
                "weighted avg": {
                    "precision": 0.7381173932749331,
                    "recall": 0.7401104642483953,
                    "f1-score": 0.7370625452618237,
                    "support": 13398
                },
                "score": 0.7401104642483953
            },
            "test": {
                "0": {
                    "precision": 0.3302752293577982,
                    "recall": 0.10682492581602374,
                    "f1-score": 0.1614349775784753,
                    "support": 337
                },
                "1": {
                    "precision": 0.6433151651170247,
                    "recall": 0.6969433831191386,
                    "f1-score": 0.6690563521173725,
                    "support": 5758
                },
                "2": {
                    "precision": 0.7256536566881394,
                    "recall": 0.6498133695283339,
                    "f1-score": 0.6856426781238811,
                    "support": 2947
                },
                "3": {
                    "precision": 0.8138126530086329,
                    "recall": 0.8197274497079818,
                    "f1-score": 0.8167593430751325,
                    "support": 7705
                },
                "accuracy": 0.7332656595211082,
                "macro avg": {
                    "precision": 0.6282641760428989,
                    "recall": 0.5683272820428695,
                    "f1-score": 0.5832233377237154,
                    "support": 16747
                },
                "weighted avg": {
                    "precision": 0.7299480080449555,
                    "recall": 0.7332656595211082,
                    "f1-score": 0.7297157564794143,
                    "support": 16747
                },
                "score": 0.7332656595211082
            }
        },
        "time": "0:10:40",
        "trial_id": 89
    },
    "time": "22:44:56"
}