{"n": [8], "num_train_samples": [30000], "num_test_samples": 1000, "num_additional_node": 1, "RoPE": false, "lr": 0.0005, "batch_size": 1000, "shuffling": true, "low_train": -2, "high_train": 2, "low_test": [-2, -4, -6, -8, -10, -12, -14, -16, -18, -20], "high_test": [2, 4, 6, 8, 10, 12, 14, 16, 18, 20], "cumulative": true, "use_integer": false, "embed_dim": 64, "num_heads": 2, "mlp_hidden_dim": 64, "mlp_num_layers": 2, "epochs": 2001, "runs": 10, "weight_decay": 0.0, "variable_length": false, "pos_enc_type": "sinusoidal"}