{
    "uuid": {
        "function": "get_ai_research_metadata",
        "field": "uuid"
    },
    "pipeline": [
        {
            "function": "get_ai_research_metadata",
            "args": {
                "deps": [
                    "input_pdf"
                ],
                "kwargs": {
                    "model": "gpt-4o-mini",
                    "temperature": 0.1,
                    "api_tools": [],
                    "write_to_json": true,
                    "title_lines": 20,
                    "volume_lines": 10,
                    "tldr_max_length": 80,
                    "tag_number": 5,
                    "dataset_dir": "data/dataset/m3sciqa"
                }
            }
        },
        {
            "function": "get_ai_research_pdf_data",
            "args": {
                "deps": [
                    "get_ai_research_metadata"
                ],
                "kwargs": {
                    "processed_data_folder": "data/dataset/m3sciqa/processed_data",
                    "TOC_threshold": 0.9
                }
            }
        },
        {
            "function": "get_ai_research_page_info",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_pdf_data"
                ],
                "kwargs": {
                    "max_length": 50,
                    "model": "gpt-4o-mini",
                    "temperature": 0.1,
                    "top_p": 0.95
                }
            }
        },
        {
            "function": "get_ai_research_per_page_chunk_info",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_page_info"
                ],
                "kwargs": {
                    "chunk_size": 512,
                    "chunk_overlap": 0
                }
            }
        },
        {
            "function": "get_ai_research_section_info",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_pdf_data"
                ],
                "kwargs": {
                    "max_length": 50,
                    "model": "gpt-4o-mini",
                    "temperature": 0.1,
                    "top_p": 0.95
                }
            }
        },
        {
            "function": "get_ai_research_per_page_table_info",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_pdf_data"
                ],
                "kwargs": {
                    "max_length": 50,
                    "model": "gpt-4o-mini",
                    "temperature": 0.1,
                    "top_p": 0.95
                }
            }
        },
        {
            "function": "get_ai_research_per_page_image_info",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_pdf_data"
                ],
                "kwargs": {
                    "max_length": 50,
                    "model": "gpt-4o-mini",
                    "temperature": 0.1,
                    "top_p": 0.95
                }
            }
        },
        {
            "function": "get_ai_research_per_page_equation_info",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_pdf_data"
                ]
            }
        },
        {
            "function": "get_ai_research_reference_info",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_pdf_data",
                    "get_ai_research_page_info"
                ],
                "kwargs": {
                    "threshold": 0.9
                }
            }
        },
        {
            "function": "write_summary_json",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_pdf_data",
                    "get_ai_research_page_info",
                    "get_ai_research_section_info",
                    "get_ai_research_per_page_table_info",
                    "get_ai_research_per_page_image_info"
                ],
                "kwargs": {
                    "processed_data_folder": "data/dataset/m3sciqa/processed_data"
                }
            }
        }
    ],
    "aggregation": [
        {
            "function": "aggregate_ai_research_metadata",
            "table": "metadata",
            "args": {
                "deps": [
                    "get_ai_research_metadata"
                ]
            }
        },
        {
            "function": "aggregate_ai_research_pages",
            "table": "pages",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_page_info"
                ]
            }
        },
        {
            "function": "aggregate_ai_research_chunks",
            "table": "chunks",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_per_page_chunk_info",
                    "get_ai_research_page_info"
                ]
            }
        },
        {
            "function": "aggregate_ai_research_tables",
            "table": "tables",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_per_page_table_info",
                    "get_ai_research_page_info"
                ]
            }
        },
        {
            "function": "aggregate_ai_research_sections",
            "table": "sections",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_section_info"
                ]
            }
        },
        {
            "function": "aggregate_ai_research_images",
            "table": "images",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_per_page_image_info",
                    "get_ai_research_page_info"
                ]
            }
        },
        {
            "function": "aggregate_ai_research_equations",
            "table": "equations",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_per_page_equation_info",
                    "get_ai_research_page_info"
                ]
            }
        },
        {
            "function": "aggregate_ai_research_references",
            "table": "reference",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_reference_info"
                ]
            }
        }
    ]
}