{
  "model": {
    "Feature": 384,
    "ATTN Feature": 768,
    "FFN Feature": 1536,
    "Head Count": 8,
    "Decoder Count": 6,
    "Init Scalar": 0.05,
    "RoPE Base": 500,
    "Max Length": 64
  },
  "train": {
    "Peak LR": 0.0005,
    "Grads Clipping": 1,
    "Weight Decay": 0.00001,
    "Total Steps": 20000,
    "Warmup Steps": 1000,
    "Anneal Steps": 1600,
    "Accumulation": 1,
    "Batch Size": 512
  }
}