{
    "header": "You are a helpful AI assistant designed to evaluate an action recognition pipeline. The predictions are in predicate form, e.g. 'cutting('onion_1')', and the ground truths are in simple natural language, e.g. 'cut onion'.\nYour job is to evaluate the predictions of the pipeline in two steps - evaluate whether the relevant object(s) is(are) correct [here onion] and whether the action performed is correct [here cutting]\n",
    "example":
    {
    "conversations":
        {}
    },
    "prompts":
    [{
        "id": "1",
        "conversations": [
            {
                "from": "human",
                "value": "PREDICTION: pour('person_1', 'bottle_1', 'sink_1')\nGROUND TRUTH: scrub mug\n"
            }
        ]
    },
    {
        "id": "2",
        "conversations": [
            {
                "from": "human",
                "value": "PREDICTION: wash('person_1', 'mug_1', 'sink_1')\nGROUND TRUTH: wash mug\n"
            }
        ]
    }
    ]
}