# Dataset selection, loader settings and input dimensions.
data:
  dataset: 'MNIST'                      # listed options: MNIST, CIFAR10, SVHN, classification_gradient
  distribution: null
  label_function: null                  # listed options: parity, all, interval
  num_workers: 4                        # number of data loading workers
  batch_size: 1000
  data_size: 20000
  # NOTE(review): 784 = 28 * 28, presumably the flattened MNIST image size; confirm
  dim_full: 784
  dim_input: 784
  feature_dim: null
  effective_dim: null
  noise: null
  structure: true                       # canonical lowercase boolean (same value as `True`)
# Model settings.
model:
  # Listed options: adp, one, two, fix, ntk
  type: 'adp'
  hidden_dim: 100
  label_num: 1
# Training settings.
train:
  # Path to net (to continue training)
  net: null
  # Number of epochs to train for
  niter: 100
  # Learning rate
  lr: 0.1
  # Listed options: adam, sgd
  optimizer: 'sgd'
  weight_decay: 0.0
  # Listed options: l1, l2, null
  decay: 'l2'
  # Listed options: hinge, cross
  loss: 'hinge'