[
  {
    "label": "FFN Layer"
  },
  {
    "label": "Causal Attention"
  },
  {
    "label": "(Full Attention for original tokens, causal attention for hidden decoding tokens)"
  },
  {
    "label": "KV Projection"
  },
  {
    "label": "Token 1"
  },
  {
    "label": "Token 2"
  },
  {
    "label": "KV Cache for 3rd token"
  },
  {
    "label": "Token 3"
  },
  {
    "label": "Scaled Query Tokens"
  },
  {
    "label": "Q Projection"
  }
]