# Root-level settings of the tuning run.
# NOTE(review): the meanings below are inferred from key names only; confirm
# against the code that loads this file.
# Presumably the random seed of the tuning procedure itself (a separate
# `seed` key also exists under [space]).
seed = 0
# Dotted path "bin.model.main" — presumably the entry point invoked for each
# trial; verify how the loader resolves it.
function = "bin.model.main"
# Presumably the total number of tuning trials — TODO confirm.
n_trials = 100

# Settings for the tuning sampler.
# NOTE(review): presumably the number of initial trials run before the
# sampler starts using its own model — confirm with the sampler's docs.
[sampler]
n_startup_trials = 20

# Root of the per-trial configuration template. Every key directly in this
# table is a fixed scalar; entries marked with "_tune_" appear only in the
# sub-tables ([space.optimizer], [space.model.*], [space.bins]).
[space]
# Distinct from the root-level `seed` key at the top of the file.
seed = 0
batch_size = 256
# NOTE(review): presumably an early-stopping patience — units (epochs vs.
# evaluations) are not visible here; confirm.
patience = 16
# NOTE(review): -1 looks like a sentinel (e.g. "no fixed epoch limit");
# verify how the training code interprets it.
n_epochs = -1
gradient_clipping_norm = 1.0
# NOTE(review): presumably toggles automatic mixed precision — confirm.
amp = true

# Dataset settings; all values here are fixed (no "_tune_" entries).
[space.data]
# NOTE(review): presumably enables caching of the prepared dataset — confirm.
cache = true
# Relative path; which directory it is resolved against is not visible here.
path = "data/regression-cat-medium-0-OnlineNewsPopularity"
# NOTE(review): presumably the preprocessing policy for numerical features;
# verify the accepted values in the data-loading code.
num_policy = "noisy-quantile"

# Optimizer settings. `type` is fixed; the two arrays begin with the "_tune_"
# marker, followed by a distribution name and its numeric arguments.
[space.optimizer]
type = "AdamW"
# NOTE(review): presumably sampled log-uniformly between 0.0001 and 0.003 —
# confirm against the tuner's distribution parsing.
lr = ["_tune_", "loguniform", 0.0001, 0.003]
# The "?"-prefixed distribution carries one extra leading number (0.0) ahead
# of the pair 0.0001, 0.1.
# NOTE(review): presumably an optional parameter that falls back to 0.0 when
# not sampled from the range — confirm.
weight_decay = ["_tune_", "?loguniform", 0.0, 0.0001, 0.1]

# Model-level settings; all values here are fixed. The tunable parts of the
# model live in the [space.model.backbone] and [space.model.num_embeddings]
# sub-tables.
[space.model]
arch_type = "tabm-mini"
# NOTE(review): the meaning of `k` is not visible in this file (possibly the
# number of ensemble members for this architecture) — confirm in the model code.
k = 32
share_training_batches = false

# Backbone settings. `type` is fixed; the remaining keys are "_tune_" arrays
# of the form [marker, distribution name, numeric arguments...].
[space.model.backbone]
type = "MLP"
# NOTE(review): presumably an integer drawn from the range 1..4 — confirm
# whether the upper bound is inclusive.
n_blocks = ["_tune_", "int", 1, 4]
# NOTE(review): the trailing 16 is presumably a step size for the integer
# range 64..1024 — confirm.
d_block = ["_tune_", "int", 64, 1024, 16]
# "?"-prefixed form with an extra leading 0.0 ahead of the pair 0.0, 0.5.
# NOTE(review): presumably optional with a fallback of 0.0 — confirm.
dropout = ["_tune_", "?uniform", 0.0, 0.0, 0.5]

# Settings for the numerical-feature embedding module. `type` is fixed; the
# other keys are "_tune_" arrays of the form
# [marker, distribution name, numeric arguments...].
[space.model.num_embeddings]
type = "GGPLEmbeddings"
# NOTE(review): the trailing 4 is presumably a step size for the integer
# range 8..32 — confirm.
d_embedding = ["_tune_", "int", 8, 32, 4]
# "?"-prefixed form with an extra leading 0.0 ahead of the pair 0.0, 0.3.
# NOTE(review): presumably optional with a fallback of 0.0 — confirm.
dropout_ratio = ["_tune_", "?uniform", 0.0, 0.0, 0.3]

# Binning settings; further options sit in the [space.bins.tree_kwargs]
# sub-table.
[space.bins]
# NOTE(review): presumably an integer drawn from the range 2..48 — confirm
# whether the upper bound is inclusive.
n_bins = ["_tune_", "int", 2, 48]

# Extra arguments for the binning step (fixed, not tuned).
# NOTE(review): "xgb_global" presumably selects a tree-based (XGBoost-style)
# method for computing bin edges — verify against the binning code.
[space.bins.tree_kwargs]
type = "xgb_global"
