{
  "train_test_sets": {
    "L3": {
      "train_set": "100_to_150",
      "test_sets": [
        "100_to_150",
        "150_to_200",
        "200_to_250",
        "250_to_300"
      ]
    },
    "L4": {
      "train_set": "100_to_150",
      "test_sets": [
        "100_to_150",
        "150_to_200",
        "200_to_250",
        "250_to_300"
      ]
    },
    "L5": {
      "train_set": "100_to_150",
      "test_sets": [
        "100_to_150",
        "150_to_200",
        "200_to_250",
        "250_to_300"
      ]
    },
    "L6": {
      "train_set": "100_to_150",
      "test_sets": [
        "100_to_150",
        "150_to_200",
        "200_to_250",
        "250_to_300"
      ]
    },
    "L7": {
      "train_set": "100_to_150",
      "test_sets": [
        "100_to_150",
        "150_to_200",
        "200_to_250",
        "250_to_300"
      ]
    },
    "L8": {
      "train_set": "100_to_150",
      "test_sets": [
        "100_to_150",
        "150_to_200",
        "200_to_250",
        "250_to_300"
      ]
    },
    "L9": {
      "train_set": "100_to_150",
      "test_sets": [
        "100_to_150",
        "150_to_200",
        "200_to_250",
        "250_to_300"
      ]
    },
    "L10": {
      "train_set": "100_to_150",
      "test_sets": [
        "100_to_150",
        "150_to_200",
        "200_to_250",
        "250_to_300"
      ]
    },
    "L11": {
      "train_set": "100_to_150",
      "test_sets": [
        "100_to_150",
        "150_to_200",
        "200_to_250",
        "250_to_300"
      ]
    },
    "L12": {
      "train_set": "100_to_150",
      "test_sets": [
        "100_to_150",
        "150_to_200",
        "200_to_250",
        "250_to_300"
      ]
    }
  },
  "heads": [
    1
  ],
  "dims": [
    64,
    256
  ],
  "lrs": [
    0.00001,
    0.000001
  ],
  "epochs": 10,
  "layers": 1,
  "input_path": "data",
  "output_path": "1_layer/models",
  "train_split": 0.8,
  "bos_token": 2
}