{
    "family": "san",
    "model_name": "gpt2",
    "train_steps": 100000,
    "n_dims": 15,
    "n_embd": 256,
    "n_layer": 12,
    "n_head": 8,
    "learning_rate": 0.0001,
    "gpu": [
        2,
        4
    ],
    "curriculum_points_start": 120,
    "curriculum_points_end": 120,
    "name": "mix8-linear_regression-quadratic_regression-relu_regression-sparse_linear_regression-decision_tree-sparse_parity_15_2-sparse_parity_15_3-disjunction_15",
    "task_list": [
        {
            "task": "linear_regression",
            "data": "gaussian",
            "batch_size": 64,
            "mu": 0,
            "scale": 1,
            "y_format": 0,
            "exp_name": "linear_regression"
        },
        {
            "task": "quadratic_regression",
            "data": "gaussian",
            "batch_size": 64,
            "mu": 0,
            "scale": 1,
            "y_format": 0,
            "exp_name": "quadratic_regression"
        },
        {
            "task": "relu_regression",
            "data": "gaussian",
            "batch_size": 64,
            "mu": 0,
            "scale": 1,
            "y_format": 0,
            "exp_name": "relu_regression"
        },
        {
            "task": "sparse_linear_regression",
            "data": "gaussian",
            "batch_size": 64,
            "mu": 0,
            "scale": 1,
            "sparsity": 3,
            "valid_coords": 10,
            "y_format": 0,
            "exp_name": "sparse_linear_regression"
        },
        {
            "task": "decision_tree",
            "data": "gaussian",
            "batch_size": 64,
            "depth": 4,
            "y_format": 0,
            "exp_name": "decision_tree"
        },
        {
            "task": "sparse_parity",
            "data": "boolean",
            "k": 2,
            "l": 105,
            "batch_size": 64,
            "y_format": 0,
            "exp_name": "sparse_parity_15_2"
        },
        {
            "task": "sparse_parity",
            "data": "boolean",
            "k": 3,
            "l": 455,
            "batch_size": 64,
            "y_format": 0,
            "exp_name": "sparse_parity_15_3"
        },
        {
            "task": "disjunction",
            "data": "boolean",
            "batch_size": 64,
            "y_format": 0,
            "exp_name": "disjunction_15"
        }
    ]
}