{
    "uuid": {
        "function": "get_ai_research_metadata",
        "field": "uuid"
    },
    "pipeline": [
        {
            "function": "parallel_batch_to_dict",
            "args": {
                "deps": [],
                "kwargs": {
                    "input_path": "data/dataset/m3sciqa/parallel/text_results.jsonl",
                    "output_path": "data/dataset/m3sciqa/parallel/text_fill.json"
                }
            }
        },
        {
            "function": "parallel_batch_to_dict",
            "args": {
                "deps": [],
                "kwargs": {
                    "input_path": "data/dataset/m3sciqa/parallel/image_results.jsonl",
                    "output_path": "data/dataset/m3sciqa/parallel/image_fill.json"
                }
            }
        },
        {
            "function": "get_ai_research_metadata",
            "args": {
                "deps": [
                    "input_pdf"
                ],
                "kwargs": {
                    "model": "gpt-4o-mini",
                    "temperature": 0.1,
                    "api_tools": [],
                    "write_to_json": true,
                    "title_lines": 20,
                    "volume_lines": 10,
                    "tldr_max_length": 80,
                    "tag_number": 5,
                    "parallel": {
                        "fill": "data/dataset/m3sciqa/parallel/text_fill.json"
                    }
                }
            }
        },
        {
            "function": "get_ai_research_pdf_data",
            "args": {
                "deps": [
                    "get_ai_research_metadata"
                ],
                "kwargs": {
                    "processed_data_folder": "data/dataset/m3sciqa/processed_data",
                    "TOC_threshold": 0.9
                }
            }
        },
        {
            "function": "get_ai_research_page_info",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_pdf_data"
                ],
                "kwargs": {
                    "max_length": 50,
                    "model": "gpt-4o-mini",
                    "temperature": 0.1,
                    "top_p": 0.95,
                    "parallel": {
                        "fill": "data/dataset/m3sciqa/parallel/text_fill.json"
                    }
                }
            }
        },
        {
            "function": "get_ai_research_per_page_chunk_info",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_page_info"
                ],
                "kwargs": {
                    "chunk_size": 512,
                    "chunk_overlap": 0
                }
            }
        },
        {
            "function": "get_ai_research_section_info",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_pdf_data"
                ],
                "kwargs": {
                    "max_length": 50,
                    "model": "gpt-4o-mini",
                    "temperature": 0.1,
                    "top_p": 0.95,
                    "parallel": {
                        "fill": "data/dataset/m3sciqa/parallel/text_fill.json"
                    }
                }
            }
        },
        {
            "function": "get_ai_research_per_page_table_info",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_pdf_data"
                ],
                "kwargs": {
                    "max_length": 50,
                    "model": "gpt-4o-mini",
                    "temperature": 0.1,
                    "top_p": 0.95,
                    "parallel": {
                        "fill": "data/dataset/m3sciqa/parallel/text_fill.json"
                    }
                }
            }
        },
        {
            "function": "get_ai_research_per_page_image_info",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_pdf_data"
                ],
                "kwargs": {
                    "max_length": 50,
                    "model": "gpt-4o-mini",
                    "temperature": 0.1,
                    "top_p": 0.95,
                    "parallel": {
                        "fill": "data/dataset/m3sciqa/parallel/image_fill.json"
                    }
                }
            }
        },
        {
            "function": "get_ai_research_per_page_equation_info",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_pdf_data"
                ]
            }
        },
        {
            "function": "get_ai_research_reference_info",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_pdf_data",
                    "get_ai_research_page_info"
                ],
                "kwargs": {
                    "threshold": 0.9
                }
            }
        },
        {
            "function": "write_summary_json",
            "args": {
                "deps": [
                    "get_ai_research_metadata",
                    "get_ai_research_pdf_data",
                    "get_ai_research_page_info",
                    "get_ai_research_section_info",
                    "get_ai_research_per_page_table_info",
                    "get_ai_research_per_page_image_info"
                ],
                "kwargs": {
                    "processed_data_folder": "data/dataset/m3sciqa/processed_data"
                }
            }
        }
    ],
    "aggregation": []
}