{"n": [8], "num_train_samples": [5000, 10000, 15000, 20000, 25000, 30000, 35000, 40000, 45000, 50000], "num_test_samples": 1000, "num_additional_node": 1, "lr": 0.0005, "batch_size": 1000, "shuffling": true, "low_train": -2, "high_train": 2, "low_test": [-6], "high_test": [6], "cumulative": true, "use_integer": false, "variable_length": false, "embed_dim": 64, "num_heads": 2, "mlp_hidden_dim": 64, "mlp_num_layers": 2, "epochs": 2001, "runs": 10, "weight_decay": 0.0}