{
  "file": "t2i_16_gpto3_step_32_low.pdf",
  "precision": 0.5714,
  "recall": 0.4,
  "design_errs": 14,
  "design_score": 0.4167,
  "blank_ratio": 0.05,
  "blank_score": 0.9091,
  "readability": 0.5,
  "align": 0.8659,
  "step": 32,
  "final_raw": 0.5347,
  "final": 0.4636,
  "text_json": "t2i_16_gpto3_step_32_low_pdf_labels.json",
  "png": "t2i_16_gpto3_step_32_low.png",
  "grid_png": "t2i_16_gpto3_step_32_low_grid.png",
  "gpt_json": "t2i_16_gpto3_step_32_low_pdf_labels_readability.json",
  "design_analysis": "1. Module 1: \"Temporal Context Encoder\\nHW D\" text overflows its box, with 'HW D' extending beyond the right boundary of the module.\n2. Module 2: \"Spatial Context Encoder\\nHW D\" text also overflows its box in the same manner.\n3. Module 3: The oval \"C\\nHW\\n2D\" in the middle significantly overlaps the pathway arrows from both the Temporal and Spatial Context Encoders, causing visual confusion.\n4. Module 4: Arrow from the right-side \"Conv 11\" (under \"Image\") merges awkwardly into the post-BN (Batch Norm) pathway, leading to ambiguity about data flow and process order.\n5. Module 5: The horizontal alignment of the two input blocks \"Events Input\\nV T K+1 K\" and \"Image Input\\nI T K\" does not match their relevant encoders; they are visually disconnected and could confuse the directionality of data.\n6. Module 6: The main convolutional blocks (Conv 11, Conv 33, ReLU, etc.) do not have uniform left/right margins, with some blocks not being horizontally aligned with others, leading to inconsistency.\n7. Module 7: The final output block \"SpatioTemporal Context Feature\\nHW D\" text does not fit within the width of its box, causing awkward line breaking.\n8. Module 8: The design uses duplicate \"Conv 11\" modules without clear differentiation or numbering, making the structure appear redundant and potentially ambiguous for readers trying to follow data flow.\n9. Module 9: The path from \"Spatial Context Encoder\\nHW D\" to its first \"Conv 11\" (right side) is misaligned vertically compared with the rest of the chart, breaking visual consistency.\n10. Module 10: The use of color for module types is inconsistent—the two input blocks (green) are not clearly defined as separate from other processes, and their styling is not matched in the legend.\n11. Module 11: The \"Events Input\" and \"Image Input\" blocks have inconsistent spacing between line breaks in their text, making the two blocks look visually unbalanced.\n12. Module 12: The shape for \"C HW 2D\" module is inconsistent with all other modules, being an oval instead of a rectangle, disrupting the visual system of representation.\n13. Module 13: There is a redundant black frame at the boundary of the image, which adds no extra information or function.\n14. Module 14: The connections from the Temporal and Spatial Context Encoders both enter the oval \"C HW 2D\" from above and the side, but the arrowheads are inconsistent in their placement and clarity.\n",
  "pdf_norm": [
    "events",
    "image",
    "temporalcontextencodernhwd",
    "spatialcontextencodernhwd",
    "cnhw2d",
    "conv11",
    "conv33",
    "relu",
    "conv11",
    "bn",
    "conv11",
    "spatiotemporalcontextfeaturenhwd",
    "eventsinputnvtk+1tk",
    "imageinputnitk"
  ],
  "read_norm": [
    "events",
    "image",
    "temporalcontextencoder",
    "hwd",
    "spatialcontextencoder",
    "hwd",
    "conv11",
    "conv33",
    "relu",
    "conv11",
    "bn",
    "spatiotemporalcontextfeature",
    "hwd",
    "eventsinput",
    "vtk+1tk",
    "imageinput",
    "itk",
    "hw",
    "c",
    "2d"
  ],
  "gt_norm": [
    "events",
    "temporalcontextencoder",
    "hwd",
    "image",
    "spatialcontextencoder",
    "hwd",
    "c",
    "hw2d",
    "conv11",
    "conv33",
    "relu",
    "conv11",
    "bn",
    "conv11",
    "spatiotemporalcontextfeature",
    "hwd",
    "eventsinput",
    "vtk+1tk",
    "imageinput",
    "itk"
  ]
}