{
    "uuid": "9f506412-ee1f-5e65-af24-4f2a07fa9948",
    "question": "Which object detector does this paper(titled \"Can VLMs Play Action Role-Playing Games? Take Black Myth Wukong as a Study Case\") use to assist the VLMs in better extracting useful information?On which datasets is this object detector pre-trained?",
    "answer_format": "Your answer should be a list like [\"detector_name\", [\"dataset1\",\"dataset2\",...]], where detector_name is the name of the object detector and [\"dataset1\",\"dataset2\",...] is a list of dataset names(abbreviation) on which the object detector is pre-trained.",
    "tags": [
        "multiple",
        "text",
        "table",
        "objective"
    ],
    "anchor_pdf": [
        "c4b97d0c-1f8b-5e9e-80f6-3e02de9cc3c6"
    ],
    "reference_pdf": [
        "e463d3fd-66ac-5c70-9991-21a3987776d2"
    ],
    "conference": [],
    "reasoning_steps": [],
    "evaluator": {
        "eval_func": "eval_conjunction",
        "eval_kwargs": {
            "eval_func_list": [
                "eval_string_exact_match",
                "eval_structured_object_exact_match"
            ],
            "eval_kwargs_list": [
                {
                    "gold": "Grounding DINO",
                    "lowercase": true
                },
                {
                    "gold": [
                        "O365",
                        "OI",
                        "GoldG",
                        "COCO",
                        "Cap4M",
                        "RefC"
                    ],
                    "ignore_order": true,
                    "lowercase": true
                }
            ]
        }
    },
    "state": {
        "gui-gpt-4o-2024-11-20": false
    },
    "annotator": "human"
}