# Path to the data file used by this run (the .pt extension suggests a
# PyTorch-saved file — confirm against the loader).
# NOTE(review): the "50-20" in the file name matches num_arm / dim_context
# below; presumably these must stay in sync — confirm.
datapath: data/gaussian50-20-1-1.pt
# bandit — environment settings.
# NOTE(review): key meanings below are inferred from their names only;
# verify against the code that reads this config.
# Number of arms.
num_arm: 50
# Dimension of the context vector.
dim_context: 20
# Presumably the horizon (number of rounds) — TODO confirm.
T: 10000
# Presumably the reward-noise scale — TODO confirm (std vs. variance).
sigma: 0.5  # alternative value left by the author: 1.0
# Name of the reward function to use; how "quadform" is resolved is not
# visible here.
func: quadform

# train — algorithm, model and optimisation settings.
# NOTE(review): key meanings below are inferred from their names only;
# verify against the code that reads this config.
# Name of the bandit algorithm to run.
algo: NeuralES
# Model family selector.
model: neural
# Three entries of 20 — presumably hidden-layer widths; TODO confirm whether
# input/output layers are included.
layers: [20, 20, 20]
# Activation name (presumably looked up by name in the NN library — confirm).
act: ReLU
# Presumably the number of optimisation iterations per update — TODO confirm.
num_iter: 100
# Presumably an exploration / perturbation scale — TODO confirm.
nu: 0.10
# Presumably the regularisation strength — TODO confirm.
reg: 1.0
# Presumably the optimiser learning rate — TODO confirm.
lr: 0.01
# NOTE(review): meaning of `m` is not evident from this file — confirm.
m: 10
# NOTE(review): meaning of `tau` is not evident from this file — confirm.
tau: 50

# log — labels for experiment tracking.
# NOTE(review): `project` / `group` look like experiment-tracker fields
# (e.g. a tracking-service project and run group) — confirm with the logger.
project: ContextualBandit-ICLR
# Group name combines the reward function (func) and algorithm (algo) above;
# presumably it should be updated whenever either of those changes.
group: Quadform-NeuralES