# Experiment-wide settings (root table). Table-specific settings live in
# [data], [model] and [train].
title = "Configuration file used for comparing gradient-based optimizers against random-feature sampling"

# NOTE(review): presumably the number of times each experiment is repeated — confirm against the consumer.
repeat = 3
# NOTE(review): presumably the degrees of freedom of the modelled system — confirm.
dof = 3
# NOTE(review): the actual precision (e.g. 32 vs 64 bit) is decided by the consuming code — confirm.
dtype = "float"
# NOTE(review): presumably selects forward-mode automatic differentiation — confirm.
auto_diff_mode = "forward"
# NOTE(review): presumably a PyTorch device string; "cuda" would then require a GPU — confirm.
device = "cuda"
# NOTE(review): meaning of the two entries is not visible in this file — TODO document.
N = [ 3, 3 ]

# Methods to compare: 'swim' (presumably the random-feature sampling method
# named in the title) against 14 gradient-based optimizers, 15 entries in total.
# NOTE(review): the list is meant to cover the optimizers available in the
# PyTorch version in use — confirm; "sgdmomentum" is presumably SGD with
# momentum enabled rather than a separate optimizer class.
optim_types = [ "swim", "adam", "adamw", "radam", "nadam", "adamax", "sgd", "sgdmomentum", "adagrad", "adadelta", "adafactor", "asgd", "lbfgs", "rmsprop", "rprop" ]

# Dataset generation settings.
# NOTE(review): mass / spring_constant suggest a mass-spring system — confirm.
[data]
n_points = 2000
# NOTE(review): presumably the fraction of n_points used for training (0.5 = even split) — confirm.
train_test_split = 0.5
mass = 1.0
spring_constant = 1.0
# NOTE(review): x_min / x_max presumably bound the sampled input domain — confirm units and meaning.
x_min = -0.5
x_max = 0.5
meshing = "rectangular"
# Seed for data generation; kept separate from model_seed and sampling_seed.
data_seed = 19582

# Network architecture settings.
[model]
# NOTE(review): width / enc_width are presumably hidden-layer and encoder widths — confirm.
width = 384
enc_width = 48
direct = false
# Both pooling stages use "sum".
local_pooling = "sum"
global_pooling = "sum"
activ_str = "softplus"
# NOTE(review): init_method is "relu" while activ_str is "softplus" — confirm the mismatch is intentional.
init_method = "relu"
# Seed for model initialisation; kept separate from data_seed and sampling_seed.
model_seed = 98745

# Training settings.
# NOTE(review): the first five keys look like settings for the sampling-based
# ('swim') path and its least-squares solve; the remaining keys look like
# settings for the gradient-based optimizers — confirm against the consumer.
[train]
param_sampler = "relu"
resample_duplicates = true
# NOTE(review): "gels" is a LAPACK least-squares driver name; presumably passed to a lstsq routine together with rcond — confirm.
driver = "gels"
rcond = 1e-6
# Seed for parameter sampling; kept separate from data_seed and model_seed.
sampling_seed = 5924
n_steps = 10_000 # number of mini-batch updates
batch_size = 256
weight_init = "kaiming_normal"
# NOTE(review): lr_start is presumably the default initial learning rate, with
# lr_start_sgd and lr_lbfgs_adadelta overriding it for the optimizers named in
# their keys, and lr_end the final rate reached by the scheduler — confirm.
lr_start = 0.01
lr_start_sgd = 5e-4
lr_lbfgs_adadelta = 0.1
lr_end = 5e-5
weight_decay = 1e-6
patience = 10_000   # equal to n_steps, i.e. no patience (presumably early stopping never triggers)
sched_type = "exponential"

