{
  "n": [8],
  "num_train_samples": [10000, 15000, 20000, 25000, 30000, 35000, 40000, 45000, 50000],
  "num_test_samples": 1000,
  "num_additional_node": 1,
  "RoPE": false,
  "lr": 0.0005,
  "batch_size": 2048,
  "shuffling": true,
  "low_train": -2,
  "high_train": 2,
  "low_test": [-6],
  "high_test": [6],
  "cumulative": true,
  "use_integer": false,
  "embed_dim": 64,
  "num_heads": 2,
  "mlp_hidden_dim": 128,
  "mlp_num_layers": 2,
  "epochs": 2001,
  "runs": 1,
  "weight_decay": 0.0000
}