# Top-level run settings. Their exact semantics are defined by the consuming
# training script, which is not part of this file.
seed = 0
n_models = 64
batch_size = 1024
# NOTE(review): -1 looks like a "no fixed epoch limit" sentinel, which would
# leave `patience` below as the stopping criterion -- confirm in the trainer.
n_epochs = -1
# This root-level patience is a different key from the `patience` set under
# [online_ensembles.greedy]; the two are configured independently.
patience = 16
# presumably the dtype used for automatic mixed precision -- TODO confirm.
amp_dtype = "bfloat16"
save_all_predictions = true
track_online_ensemble_history = true
track_experiments = true

# Dataset location and preprocessing policies.
[data]
# NOTE(review): the path is not absolute, so it is presumably resolved
# relative to the working directory or a project root -- confirm.
path = "data/tabred/maps-routing"
# NOTE(review): together with bin_policy, this presumably derives binary
# features from numeric columns and handles them as categorical ones --
# verify against the data loader.
extract_bin_from_num = true
bin_policy = "convert-to-cat"
cat_policy = "ordinal"
cache = true

# Fixed (non-tuned) model settings. Further model keys (n_blocks, dropout)
# are listed in [sampler.space.model] rather than here.
[model]
activation = "ReLU"
# presumably the hidden width of each block -- TODO confirm.
d_block = 384

# Fixed settings for the `num_embeddings` component of the model (presumably
# embeddings of numerical features -- TODO confirm). d_embedding and
# init_scale are listed in [sampler.space.model.num_embeddings] rather than here.
[model.num_embeddings]
type = "PeriodicEmbeddingsPack"
bias = true
elementwise_affine = true
concat_input = true

# Fixed optimizer settings. lr, weight_decay and muon_lr are listed in
# [sampler.space.optimizer] rather than here.
[optimizer]
type = "MuonAdamWPack"
# NOTE(review): meaning of shared_step is defined by the optimizer
# implementation, which is not visible here -- confirm before changing.
shared_step = true

# Configuration of the online ensemble registered under the name `greedy`.
[online_ensembles.greedy]
type = "greedy"
update_type = "latest"
include_current_ensemble_in_pool = true
# Separate from (and larger than) the root-level `patience = 16`.
# NOTE(review): presumably counted in the same units as the root-level
# patience -- confirm.
patience = 32

# Extra options for the `greedy` online ensemble.
[online_ensembles.greedy.options]
# Half of the root-level n_models (64).
# NOTE(review): presumably an upper bound on how many members the ensemble
# may hold -- confirm how it relates to the n_models pool.
max_ensemble_size = 32

# Hyperparameter sampler. Its search space is given by the [sampler.space.*]
# tables, whose layout mirrors [model], [model.num_embeddings] and [optimizer].
[sampler]
type = "RandomSampler"

# Search space for keys of [model].
# NOTE(review): each entry appears to be ["_tune_", <distribution>, <args...>];
# the argument meanings below are assumptions to confirm against the sampler.
[sampler.space.model]
# presumably an integer drawn from [1, 3] -- TODO confirm bounds are inclusive.
n_blocks = ["_tune_", "int", 1, 3]
# NOTE(review): the "?" prefix and the extra leading 0.0 suggest an optional
# parameter (a fallback value of 0.0, otherwise uniform over [0.0, 0.5]) --
# confirm.
dropout = ["_tune_", "?uniform", 0.0, 0.0, 0.5]

# Search space for keys of [model.num_embeddings].
[sampler.space.model.num_embeddings]
# NOTE(review): the trailing 4 is presumably a step, i.e. values 8, 12, ..., 24
# -- confirm against the sampler.
d_embedding = ["_tune_", "int", 8, 24, 4]
# presumably log-uniform over [0.01, 10.0] -- TODO confirm.
init_scale = ["_tune_", "loguniform", 0.01, 10.0]

# Search space for keys of [optimizer]. All three entries use the "loguniform"
# distribution; the two numbers are presumably the low/high bounds -- TODO confirm.
[sampler.space.optimizer]
lr = ["_tune_", "loguniform", 0.0001, 0.005]
weight_decay = ["_tune_", "loguniform", 0.001, 1.0]
# NOTE(review): presumably a separate learning rate for the Muon part of
# "MuonAdamWPack", with `lr` used for the AdamW part -- confirm.
muon_lr = ["_tune_", "loguniform", 0.001, 0.1]
