[{"id": "CharXiv_13_23", "dataset_name": "CharXiv", "image": "CharXiv_13_23.jpg", "source": "dev", "task": "Arithmetic Reasoning", "question": "For the subplot at row 5 and column 2, what is the difference between the maximum and minimum values of the tick labels on the continuous legend (i.e., colorbar)?\n        * You should remove the percentage sign (if any) in your answer.\n        * If the plot does not have an explicit colorbar-based continuous legend or the legend is not considered relevant to this subplot, answer \"Not Applicable\".", "ground_truth": [{"answer": "0.8", "bbox": [], "supporting_evidence": [{"text": "1.6", "bbox": [365, 24, 408, 44]}, {"text": "2.4", "bbox": [539, 24, 582, 46]}]}]}, {"id": "CharXiv_13_104", "dataset_name": "CharXiv", "image": "CharXiv_13_104.jpg", "source": "dev", "task": "Arithmetic Reasoning", "question": "What is the approximate difference in key rate between n = 10^7 and n = 10^15 at a QBER of 0%?\n    * Your final answer must be a number with 1 decimal places.\n    ", "ground_truth": [{"answer": "0.6", "bbox": [], "supporting_evidence": [{"text": "0.4", "bbox": [61, 483, 169, 515]}, {"text": "1", "bbox": [85, 332, 161, 357]}]}]}, {"id": "DUDE_10_20", "dataset_name": "DUDE", "image": "DUDE_10_20.jpg", "source": "dev", "task": "Arithmetic Reasoning", "question": "How many years did William Perry Pendley acted as a president?", "ground_truth": [{"answer": "29 years", "bbox": [], "supporting_evidence": [{"text": "1989 - 2018", "bbox": [741, 145, 835, 160]}]}]}, {"id": "DUDE_10_100", "dataset_name": "DUDE", "image": "DUDE_10_100.jpg", "source": "dev", "task": "Arithmetic Reasoning", "question": "What is the percentage of men in the labor force in the document?", "ground_truth": [{"answer": "53%", "bbox": [], "supporting_evidence": [{"text": "(47%),", "bbox": [280, 266, 377, 275]}]}]},
{"id": "InfographicVQA_14_29", "dataset_name": "InfographicVQA", "image": "InfographicVQA_14_29.jpg", "source": "test", "task": "Arithmetic Reasoning", "question": "How much more is the value of sales from marijuana, when compared to that from cocaine($m)?", "ground_truth": [{"answer": "0.5", "bbox": [], "supporting_evidence": [{"text": "5.2", "bbox": [369, 261, 406, 280]}, {"text": "5.7", "bbox": [583, 256, 620, 277]}]}]}, {"id": "InfographicVQA_14_148", "dataset_name": "InfographicVQA", "image": "InfographicVQA_14_148.jpg", "source": "test", "task": "Arithmetic Reasoning", "question": "What is the combined percentage of zinc and copper, taken together?", "ground_truth": [{"answer": "100%", "bbox": [], "supporting_evidence": [{"text": "97.5%", "bbox": [354, 864, 417, 870]}, {"text": "2.5%", "bbox": [472, 864, 522, 870]}]}]}, {"id": "TAT-DQA_12_62", "dataset_name": "TAT-DQA", "image": "TAT-DQA_12_62.png", "source": "test", "task": "Arithmetic Reasoning", "question": "What is the percentage change in total segment net revenues between 2018 and 2019?", "ground_truth": [{"answer": "-12.67%", "bbox": [], "supporting_evidence": [{"text": "6,835", "bbox": [876, 430, 913, 444]}, {"text": "5,969", "bbox": [876, 273, 913, 287]}]}]}, {"id": "TAT-DQA_12_228", "dataset_name": "TAT-DQA", "image": "TAT-DQA_12_228.png", "source": "test", "task": "Arithmetic Reasoning", "question": "What was the change in the amount for contracts within one year?", "ground_truth": [{"answer": "2.8", "bbox": [], "supporting_evidence": [{"text": "18.3", "bbox": [836, 830, 866, 841]}, {"text": "15.5", "bbox": [918, 829, 945, 842]}]}]}, {"id": "WTQ_11_20", "dataset_name": "WTQ", "image": "WTQ_11_20.jpg", "source": "test", "task": "Arithmetic Reasoning", "question": "what is the difference in time between when cosmo-bot was and slobot?", "ground_truth": [{"answer": "143 years", "bbox": [], "supporting_evidence": [{"text": "1531", "bbox": [536, 61, 566, 78]}, {"text": "1674", "bbox": [536, 584, 567, 602]}]}]}, {"id": "WTQ_11_31", "dataset_name": "WTQ", "image": "WTQ_11_31.jpg", "source": "test", "task": "Arithmetic Reasoning", "question": 
"how long did charlie sheen go without a nomination after 2008?", "ground_truth": [{"answer": "2 years", "bbox": [], "supporting_evidence": [{"text": "2008", "bbox": [16, 792, 50, 812]}, {"text": "2010", "bbox": [16, 878, 50, 897]}]}]}]