{
  "train_test_sets": {
    "L3": {
      "train_set": "100_to_150",
      "test_sets": ["100_to_150","150_to_200","200_to_250","250_to_300"]
    },
    "L4": {
      "train_set": "100_to_150",
      "test_sets": ["100_to_150","150_to_200","200_to_250","250_to_300"]
    },
    "L5": {
      "train_set": "100_to_150",
      "test_sets": ["100_to_150","150_to_200","200_to_250","250_to_300"]
    },
    "L6": {
      "train_set": "100_to_150",
      "test_sets": ["100_to_150","150_to_200","200_to_250","250_to_300"]
    },
    "L7": {
      "train_set": "100_to_150",
      "test_sets": ["100_to_150","150_to_200","200_to_250","250_to_300"]
    },
    "L8": {
      "train_set": "100_to_150",
      "test_sets": ["100_to_150","150_to_200","200_to_250","250_to_300"]
    },
    "L9": {
      "train_set": "100_to_150",
      "test_sets": ["100_to_150","150_to_200","200_to_250","250_to_300"]
    },
    "L10": {
      "train_set": "100_to_150",
      "test_sets": ["100_to_150","150_to_200","200_to_250","250_to_300"]
    },
    "L11": {
      "train_set": "100_to_150",
      "test_sets": ["100_to_150","150_to_200","200_to_250","250_to_300"]
    },
    "L12": {
      "train_set": "100_to_150",
      "test_sets": ["100_to_150","150_to_200","200_to_250","250_to_300"]
    }
  },
  "heads": [
    1
  ],
  "dims": [
    64,
    256
  ],
  "lrs": [
    0.00001,
    0.000001
  ],
  "epochs": 10,
  "layers": 9,
  "input_path": "data",
  "output_path": "9_layer/models",
  "train_split": 0.8,
  "bos_token": 2
}

