# Run configuration: MLP model on the "energy" dataset with a
# cross-entropy loss.
model: mlp
model_path: energy_ce
dataset_name: energy
loss_type: cross_entropy
range_size: 50
batch_size: 32
# NOTE(review): whether 0 is a device index or a device count depends on
# the consumer of this file - confirm.
devices: 0
# Written with an explicit mantissa dot so that YAML 1.1 loaders
# (e.g. PyYAML) resolve it as a float; a bare 1e-4 is loaded as the
# string "1e-4" by those loaders.
lr: 1.0e-4
ffn_activation: relu
ffn_hidden_dim: 1000
ffn_num_layers: 4
# NOTE(review): a plain scalar containing a comma loads as the single
# string "0, 1", not as a two-element list. Left as-is because the
# consumer may split the string itself; if it expects a sequence, this
# should become [0, 1] - confirm against the loader code.
constraint_weights: 0, 1
max_epochs: 3000
# Explicit mantissa dot for the same reason as lr above.
weight_decay: 1.0e-4
optimizer: adamw
# Leading zero added for readability; the value is unchanged.
lq_norm_val: 0.5
