{
    "pipeline": [
        {
            "function": "get_ai_research_metadata",
            "args": {
                "deps": [
                    "input_pdf"
                ],
                "kwargs": {
                    "tldr_max_length": 80,
                    "tag_number": 5,
                    "parallel": {
                        "extract": "data/dataset/airqa/parallel/text_extract.jsonl"
                    }
                }
            }
        },
        {
            "function": "get_ai_research_pdf_data",
            "args": {
                "deps": [
                    "get_ai_research_metadata"
                ],
                "kwargs": {
                    "processed_data_folder": "data/dataset/airqa/processed_data",
                    "TOC_threshold": 0.9
                }
            }
        },
        {
            "function": "get_ai_research_page_info",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_pdf_data"
                ],
                "kwargs": {
                    "max_length": 50,
                    "parallel": {
                        "extract": "data/dataset/airqa/parallel/text_extract.jsonl"
                    }
                }
            }
        },
        {
            "function": "get_ai_research_section_info",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_pdf_data"
                ],
                "kwargs": {
                    "max_length": 50,
                    "parallel": {
                        "extract": "data/dataset/airqa/parallel/text_extract.jsonl"
                    }
                }
            }
        },
        {
            "function": "get_ai_research_per_page_table_info",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_pdf_data"
                ],
                "kwargs": {
                    "max_length": 50,
                    "parallel": {
                        "extract": "data/dataset/airqa/parallel/text_extract.jsonl"
                    }
                }
            }
        },
        {
            "function": "get_ai_research_per_page_image_info",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_pdf_data"
                ],
                "kwargs": {
                    "max_length": 50,
                    "parallel": {
                        "extract": "data/dataset/airqa/parallel/image_extract.jsonl"
                    }
                }
            }
        },
        {
            "function": "parallel_message_to_batch",
            "args": {
                "deps": [],
                "kwargs": {
                    "input_path": "data/dataset/airqa/parallel/text_extract.jsonl",
                    "output_path": "data/dataset/airqa/parallel/text_batch.jsonl",
                    "model": "qwen2.5-72b-instruct"
                }
            }
        },
        {
            "function": "parallel_message_to_batch",
            "args": {
                "deps": [],
                "kwargs": {
                    "input_path": "data/dataset/airqa/parallel/image_extract.jsonl",
                    "output_path": "data/dataset/airqa/parallel/image_batch.jsonl",
                    "model": "qwen2-vl-72b-instruct"
                }
            }
        }
    ],
    "aggregation": []
}