{
  "schema_version": "2.0",
  "metadata": {
    "diagram_id": "doc_layout_pipeline_v1"
  },
  "global_properties": {
    "topic": "Document Layout Analysis Pipeline",
    "purpose": "architecture_overview",
    "target_audience": "researcher",
    "complexity_level": "detailed_schematic",
    "domain": "Computer Vision",
    "visual_format": "block_diagram",
    "diagram_type": "architecture_diagram",
    "layout_grid": "5-tier_vertical",
    "style_theme": "professional_light",
    "background_color": "#FFFFFF",
    "font_family": "Helvetica, Arial, sans-serif",
    "title": {
      "text": "Document Layout Analysis Pipeline",
      "is_present": false
    }
  },
  "components": [
    {
      "id": "c_input",
      "type": "shape_node",
      "label": "Input",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#B4C6E7",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "bold",
        "text_color": "#000000"
      }
    },
    {
      "id": "gc_loader",
      "type": "group_container",
      "label": "Loader Layer",
      "geometry": {
        "shape": "rectangle"
      },
      "styling": {
        "fill_color": "#F6FFF6",
        "border_color": "#CCCCCC",
        "border_width": 0,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "bold",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_pdf",
      "type": "shape_node",
      "label": "Searchable PDF",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#C6E0B4",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_scanpdf",
      "type": "shape_node",
      "label": "Scan PDF / Image",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#C6E0B4",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_ppt",
      "type": "shape_node",
      "label": "MS PowerPoint",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#C6E0B4",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_word",
      "type": "shape_node",
      "label": "MS Word",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#C6E0B4",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_excel",
      "type": "shape_node",
      "label": "MS Excel",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#C6E0B4",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_html",
      "type": "shape_node",
      "label": "HTML",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#C6E0B4",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "gc_auxiliary",
      "type": "group_container",
      "label": "Auxiliary Layer",
      "geometry": {
        "shape": "rectangle"
      },
      "styling": {
        "fill_color": "#F6F6FF",
        "border_color": "#CCCCCC",
        "border_width": 0,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "bold",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_searchable",
      "type": "shape_node",
      "label": "Searchable / Non-searchable",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#EAD1DC",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_convert",
      "type": "shape_node",
      "label": "Convert File",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#EAD1DC",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_fixbroken",
      "type": "shape_node",
      "label": "Fix Broken File",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#EAD1DC",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_fixfont",
      "type": "shape_node",
      "label": "Fix Font Issue",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#EAD1DC",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "gc_layout",
      "type": "group_container",
      "label": "Layout Analysis Layer",
      "geometry": {
        "shape": "rectangle"
      },
      "styling": {
        "fill_color": "#FFF6E6",
        "border_color": "#CCCCCC",
        "border_width": 0,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "bold",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_dla",
      "type": "shape_node",
      "label": "DLA Models",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#F8CBAD",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "bold",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_dit",
      "type": "shape_node",
      "label": "DiT",
      "geometry": {
        "shape": "rectangle"
      },
      "styling": {
        "fill_color": "#FFFFFF",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_yolov9",
      "type": "shape_node",
      "label": "YOLOv9",
      "geometry": {
        "shape": "rectangle"
      },
      "styling": {
        "fill_color": "#FFFFFF",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_spreadsheet",
      "type": "shape_node",
      "label": "Spreadsheet Table Detection Model",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#F8CBAD",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "bold",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_rulebased",
      "type": "shape_node",
      "label": "Rule-based Layout Analysis",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#F8CBAD",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "bold",
        "text_color": "#000000"
      }
    },
    {
      "id": "gc_elements",
      "type": "group_container",
      "label": "Elements Layer",
      "geometry": {
        "shape": "rectangle"
      },
      "styling": {
        "fill_color": "#F6F6FF",
        "border_color": "#CCCCCC",
        "border_width": 0,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "bold",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_table",
      "type": "shape_node",
      "label": "Table",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#BDD7EE",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "bold",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_tableclassify",
      "type": "shape_node",
      "label": "Table Classify",
      "geometry": {
        "shape": "rectangle"
      },
      "styling": {
        "fill_color": "#FFFFFF",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_heuristic_table",
      "type": "shape_node",
      "label": "Heuristic",
      "geometry": {
        "shape": "rectangle"
      },
      "styling": {
        "fill_color": "#FFFFFF",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_tatr",
      "type": "shape_node",
      "label": "TATR",
      "geometry": {
        "shape": "rectangle"
      },
      "styling": {
        "fill_color": "#FFFFFF",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_figure",
      "type": "shape_node",
      "label": "Figure",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#BDD7EE",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "bold",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_figureclassify",
      "type": "shape_node",
      "label": "Figure Classify",
      "geometry": {
        "shape": "rectangle"
      },
      "styling": {
        "fill_color": "#FFFFFF",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_vlm",
      "type": "shape_node",
      "label": "VLM",
      "geometry": {
        "shape": "rectangle"
      },
      "styling": {
        "fill_color": "#FFFFFF",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_ocr",
      "type": "shape_node",
      "label": "OCR",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#BDD7EE",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "bold",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_rotated",
      "type": "shape_node",
      "label": "Rotated",
      "geometry": {
        "shape": "rectangle"
      },
      "styling": {
        "fill_color": "#FFFFFF",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_horizontal",
      "type": "shape_node",
      "label": "Horizontal",
      "geometry": {
        "shape": "rectangle"
      },
      "styling": {
        "fill_color": "#FFFFFF",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "gc_restructuring",
      "type": "group_container",
      "label": "Restructuring Layer",
      "geometry": {
        "shape": "rectangle"
      },
      "styling": {
        "fill_color": "#FFF6E6",
        "border_color": "#CCCCCC",
        "border_width": 0,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "bold",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_readingorder",
      "type": "shape_node",
      "label": "Reading Order",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#F8CBAD",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "bold",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_heuristic_reading",
      "type": "shape_node",
      "label": "Heuristic",
      "geometry": {
        "shape": "rectangle"
      },
      "styling": {
        "fill_color": "#FFFFFF",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_layoutlmv3_reading",
      "type": "shape_node",
      "label": "LayoutLMv3",
      "geometry": {
        "shape": "rectangle"
      },
      "styling": {
        "fill_color": "#FFFFFF",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_relation",
      "type": "shape_node",
      "label": "Relation Extraction",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#F8CBAD",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "bold",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_layoutlmv3_relation",
      "type": "shape_node",
      "label": "LayoutLMv3",
      "geometry": {
        "shape": "rectangle"
      },
      "styling": {
        "fill_color": "#FFFFFF",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "normal",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_hierarchy",
      "type": "shape_node",
      "label": "Hierarchy Recovering",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#F8CBAD",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "bold",
        "text_color": "#000000"
      }
    },
    {
      "id": "c_output",
      "type": "shape_node",
      "label": "Output",
      "geometry": {
        "shape": "rounded_rectangle"
      },
      "styling": {
        "fill_color": "#C6E0B4",
        "border_color": "#000000",
        "border_width": 1,
        "border_style": "solid"
      },
      "text_properties": {
        "font_weight": "bold",
        "text_color": "#000000"
      }
    }
  ],
  "connections": [
    {
      "id": "conn_input_loader",
      "from_id": "c_input",
      "to_id": "gc_loader",
      "label": {
        "text": "",
        "position": "middle_above",
        "text_color": "#000000"
      },
      "line_properties": {
        "type": "straight",
        "style": "solid",
        "color": "#000000",
        "width": 2
      },
      "arrowhead": {
        "start_type": "none",
        "end_type": "solid_triangle",
        "size": "medium"
      }
    },
    {
      "id": "conn_loader_aux",
      "from_id": "gc_loader",
      "to_id": "gc_auxiliary",
      "label": {
        "text": "",
        "position": "middle_above",
        "text_color": "#000000"
      },
      "line_properties": {
        "type": "straight",
        "style": "solid",
        "color": "#000000",
        "width": 2
      },
      "arrowhead": {
        "start_type": "none",
        "end_type": "solid_triangle",
        "size": "medium"
      }
    },
    {
      "id": "conn_aux_layout",
      "from_id": "gc_auxiliary",
      "to_id": "gc_layout",
      "label": {
        "text": "",
        "position": "middle_above",
        "text_color": "#000000"
      },
      "line_properties": {
        "type": "straight",
        "style": "solid",
        "color": "#000000",
        "width": 2
      },
      "arrowhead": {
        "start_type": "none",
        "end_type": "solid_triangle",
        "size": "medium"
      }
    },
    {
      "id": "conn_layout_elements",
      "from_id": "gc_layout",
      "to_id": "gc_elements",
      "label": {
        "text": "",
        "position": "middle_above",
        "text_color": "#000000"
      },
      "line_properties": {
        "type": "straight",
        "style": "solid",
        "color": "#000000",
        "width": 2
      },
      "arrowhead": {
        "start_type": "none",
        "end_type": "solid_triangle",
        "size": "medium"
      }
    },
    {
      "id": "conn_elements_restructuring",
      "from_id": "gc_elements",
      "to_id": "gc_restructuring",
      "label": {
        "text": "",
        "position": "middle_above",
        "text_color": "#000000"
      },
      "line_properties": {
        "type": "straight",
        "style": "solid",
        "color": "#000000",
        "width": 2
      },
      "arrowhead": {
        "start_type": "none",
        "end_type": "solid_triangle",
        "size": "medium"
      }
    },
    {
      "id": "conn_restructuring_output",
      "from_id": "gc_restructuring",
      "to_id": "c_output",
      "label": {
        "text": "",
        "position": "middle_above",
        "text_color": "#000000"
      },
      "line_properties": {
        "type": "straight",
        "style": "solid",
        "color": "#000000",
        "width": 2
      },
      "arrowhead": {
        "start_type": "none",
        "end_type": "solid_triangle",
        "size": "medium"
      }
    }
  ],
  "layout_constraints": [
    {
      "type": "containment",
      "container_id": "gc_loader",
      "element_ids": [
        "c_pdf",
        "c_scanpdf",
        "c_ppt",
        "c_word",
        "c_excel",
        "c_html"
      ],
      "padding": "medium"
    },
    {
      "type": "distribution",
      "distribution_type": "horizontal_equal_spacing",
      "element_ids": [
        "c_pdf",
        "c_scanpdf",
        "c_ppt",
        "c_word",
        "c_excel",
        "c_html"
      ]
    },
    {
      "type": "containment",
      "container_id": "gc_auxiliary",
      "element_ids": [
        "c_searchable",
        "c_convert",
        "c_fixbroken",
        "c_fixfont"
      ],
      "padding": "medium"
    },
    {
      "type": "distribution",
      "distribution_type": "horizontal_equal_spacing",
      "element_ids": [
        "c_searchable",
        "c_convert",
        "c_fixbroken",
        "c_fixfont"
      ]
    },
    {
      "type": "containment",
      "container_id": "gc_layout",
      "element_ids": [
        "c_dla",
        "c_spreadsheet",
        "c_rulebased"
      ],
      "padding": "medium"
    },
    {
      "type": "distribution",
      "distribution_type": "horizontal_equal_spacing",
      "element_ids": [
        "c_dla",
        "c_spreadsheet",
        "c_rulebased"
      ]
    },
    {
      "type": "containment",
      "container_id": "c_dla",
      "element_ids": [
        "c_dit",
        "c_yolov9"
      ],
      "padding": "small"
    },
    {
      "type": "distribution",
      "distribution_type": "horizontal_equal_spacing",
      "element_ids": [
        "c_dit",
        "c_yolov9"
      ]
    },
    {
      "type": "containment",
      "container_id": "gc_elements",
      "element_ids": [
        "c_table",
        "c_figure",
        "c_ocr"
      ],
      "padding": "medium"
    },
    {
      "type": "distribution",
      "distribution_type": "horizontal_equal_spacing",
      "element_ids": [
        "c_table",
        "c_figure",
        "c_ocr"
      ]
    },
    {
      "type": "containment",
      "container_id": "c_table",
      "element_ids": [
        "c_tableclassify",
        "c_heuristic_table",
        "c_tatr"
      ],
      "padding": "small"
    },
    {
      "type": "distribution",
      "distribution_type": "horizontal_equal_spacing",
      "element_ids": [
        "c_tableclassify",
        "c_heuristic_table",
        "c_tatr"
      ]
    },
    {
      "type": "containment",
      "container_id": "c_figure",
      "element_ids": [
        "c_figureclassify",
        "c_vlm"
      ],
      "padding": "small"
    },
    {
      "type": "distribution",
      "distribution_type": "horizontal_equal_spacing",
      "element_ids": [
        "c_figureclassify",
        "c_vlm"
      ]
    },
    {
      "type": "containment",
      "container_id": "c_ocr",
      "element_ids": [
        "c_rotated",
        "c_horizontal"
      ],
      "padding": "small"
    },
    {
      "type": "distribution",
      "distribution_type": "horizontal_equal_spacing",
      "element_ids": [
        "c_rotated",
        "c_horizontal"
      ]
    },
    {
      "type": "containment",
      "container_id": "gc_restructuring",
      "element_ids": [
        "c_readingorder",
        "c_relation",
        "c_hierarchy"
      ],
      "padding": "medium"
    },
    {
      "type": "distribution",
      "distribution_type": "horizontal_equal_spacing",
      "element_ids": [
        "c_readingorder",
        "c_relation",
        "c_hierarchy"
      ]
    },
    {
      "type": "containment",
      "container_id": "c_readingorder",
      "element_ids": [
        "c_heuristic_reading",
        "c_layoutlmv3_reading"
      ],
      "padding": "small"
    },
    {
      "type": "distribution",
      "distribution_type": "horizontal_equal_spacing",
      "element_ids": [
        "c_heuristic_reading",
        "c_layoutlmv3_reading"
      ]
    },
    {
      "type": "containment",
      "container_id": "c_relation",
      "element_ids": [
        "c_layoutlmv3_relation"
      ],
      "padding": "small"
    }
  ]
}