# Launch main.py with the `camera` data selection and the overrides below.
# Each argument is a key=value pair handed verbatim to main.py
# (presumably Hydra/OmegaConf-style config overrides -- confirm in main.py).
# Arguments are kept in their original order, one per line, so a single
# setting can be edited or diffed in isolation.
python main.py \
  data=camera \
  model.neomlp_attention.ffn_dim=128 \
  model.embed_dim=128 \
  model.neomlp_attention.num_heads=4 \
  model.neomlp_attention.num_layers=3 \
  data.batch_size=65536 \
  optim.lr=5e-3 \
  model.pos_embedding_dim=256 \
  model.pos_embedding_sigma=20.0 \
  model.num_nodes=16 \
  model.neomlp_attention.use_layer_norm=False \
  data.num_epochs=10001 \
  pre_load_to_device=False \
  model.input_init_sigma=0.001 \
  model.init_sigma=0.001
