{"start_time": "2023-09-17 11:54:15", "temperature": 1.0, "top_p": 1.0, "check": true, "tool_graph": "graph_desc_multimedia.json", "tool_desc": "tools_desc_multimedia.json", "api_addr": "10.15.82.10", "api_port": 8002, "play": false, "method": null, "tool_number": null, "number_of_samples": 1000, "seed": 0, "output_dir": "result_20230917115415_tools_desc_multimedia_gpt-4_t1_0_p1_0_check", "save_figure": false, "multiworker": 5, "llm": "gpt-4"}
{"total": 100, "avg_time_per_sample": "0:00:07.680784", "success": 100, "fail": 0}
{"total": 200, "avg_time_per_sample": "0:00:07.838613", "success": 200, "fail": 0}
{"total": 300, "avg_time_per_sample": "0:00:07.655741", "success": 300, "fail": 0}
{"total": 400, "avg_time_per_sample": "0:00:07.605692", "success": 400, "fail": 0}
{"total": 500, "avg_time_per_sample": "0:00:07.704065", "success": 500, "fail": 0}
{"total": 600, "avg_time_per_sample": "0:00:07.794423", "success": 600, "fail": 0}
{"total": 700, "avg_time_per_sample": "0:00:07.722347", "success": 700, "fail": 0}
{"start_time": "2023-09-17 18:11:13", "temperature": 1.0, "top_p": 1.0, "check": true, "tool_graph": "graph_desc_multimedia.json", "tool_desc": "tools_desc_multimedia.json", "api_addr": "10.15.82.10", "api_port": 8002, "play": false, "method": null, "tool_number": null, "number_of_samples": 1000, "seed": 0, "output_dir": "result_20230917115415_tools_desc_multimedia_gpt-4_t1_0_p1_0_check", "save_figure": false, "multiworker": 10, "llm": "gpt-4"}
{"total": 100, "avg_time_per_sample": "0:00:04.869397", "success": 87, "fail": 13, "<class '__main__.RateLimitError'>": 12, "<class '__main__.ContentFormatError'>": 1}
{"total": 200, "avg_time_per_sample": "0:00:05.236272", "success": 170, "fail": 30, "<class '__main__.RateLimitError'>": 28, "<class '__main__.ContentFormatError'>": 2}
{"total": 300, "avg_time_per_sample": "0:00:05.315112", "success": 254, "fail": 46, "<class '__main__.RateLimitError'>": 42, "<class '__main__.ContentFormatError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 1}
{"total": 400, "avg_time_per_sample": "0:00:05.346313", "success": 339, "fail": 61, "<class '__main__.RateLimitError'>": 57, "<class '__main__.ContentFormatError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 1}
{"total": 500, "avg_time_per_sample": "0:00:05.344328", "success": 425, "fail": 75, "<class '__main__.RateLimitError'>": 70, "<class '__main__.ContentFormatError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 2}
{"total": 600, "avg_time_per_sample": "0:00:05.346085", "success": 512, "fail": 88, "<class '__main__.RateLimitError'>": 83, "<class '__main__.ContentFormatError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 2}
{"total": 700, "avg_time_per_sample": "0:00:05.324332", "success": 602, "fail": 98, "<class '__main__.RateLimitError'>": 93, "<class '__main__.ContentFormatError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 2}
{"total": 800, "avg_time_per_sample": "0:00:05.326868", "success": 683, "fail": 117, "<class '__main__.RateLimitError'>": 111, "<class '__main__.ContentFormatError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 2, "<class 'KeyError'>": 1}
{"total": 900, "avg_time_per_sample": "0:00:05.318307", "success": 773, "fail": 127, "<class '__main__.RateLimitError'>": 120, "<class '__main__.ContentFormatError'>": 4, "<class 'asyncio.exceptions.TimeoutError'>": 2, "<class 'KeyError'>": 1}
{"total": 1000, "avg_time_per_sample": "0:00:05.348572", "success": 857, "fail": 143, "<class '__main__.RateLimitError'>": 135, "<class '__main__.ContentFormatError'>": 5, "<class 'asyncio.exceptions.TimeoutError'>": 2, "<class 'KeyError'>": 1}
{"start_time": "2023-09-17 19:30:48", "temperature": 1.0, "top_p": 1.0, "check": true, "tool_graph": "graph_desc_multimedia.json", "tool_desc": "tools_desc_multimedia.json", "api_addr": "10.15.82.10", "api_port": 8002, "play": false, "method": null, "tool_number": null, "number_of_samples": 100, "seed": 0, "output_dir": "result_20230917115415_tools_desc_multimedia_gpt-4_t1_0_p1_0_check", "save_figure": false, "multiworker": 10, "llm": "gpt-4"}
{"total": 100, "avg_time_per_sample": "0:00:05.394157", "success": 89, "fail": 11, "<class '__main__.RateLimitError'>": 10, "<class 'KeyError'>": 1}
{"start_time": "2023-09-17 20:40:10", "temperature": 1.0, "top_p": 1.0, "check": true, "tool_graph": "graph_desc_multimedia.json", "tool_desc": "tools_desc_multimedia.json", "api_addr": "10.15.82.10", "api_port": 8002, "play": false, "method": null, "tool_number": null, "number_of_samples": 1000, "seed": 0, "output_dir": "result_20230917115415_tools_desc_multimedia_gpt-4_t1_0_p1_0_check", "save_figure": false, "multiworker": 10, "llm": "gpt-4"}
{"total": 100, "avg_time_per_sample": "0:00:05.638559", "success": 82, "fail": 18, "<class '__main__.RateLimitError'>": 17, "<class '__main__.ContentFormatError'>": 1}
{"total": 200, "avg_time_per_sample": "0:00:05.913246", "success": 159, "fail": 41, "<class '__main__.RateLimitError'>": 36, "<class '__main__.ContentFormatError'>": 4, "<class 'KeyError'>": 1}
{"total": 300, "avg_time_per_sample": "0:00:05.860773", "success": 239, "fail": 61, "<class '__main__.RateLimitError'>": 53, "<class '__main__.ContentFormatError'>": 5, "<class 'KeyError'>": 2, "<class 'asyncio.exceptions.TimeoutError'>": 1}
{"total": 400, "avg_time_per_sample": "0:00:05.823570", "success": 323, "fail": 77, "<class '__main__.RateLimitError'>": 68, "<class '__main__.ContentFormatError'>": 6, "<class 'KeyError'>": 2, "<class 'asyncio.exceptions.TimeoutError'>": 1}
{"total": 500, "avg_time_per_sample": "0:00:05.776520", "success": 409, "fail": 91, "<class '__main__.RateLimitError'>": 80, "<class '__main__.ContentFormatError'>": 8, "<class 'KeyError'>": 2, "<class 'asyncio.exceptions.TimeoutError'>": 1}
{"total": 600, "avg_time_per_sample": "0:00:05.746243", "success": 495, "fail": 105, "<class '__main__.RateLimitError'>": 92, "<class '__main__.ContentFormatError'>": 9, "<class 'KeyError'>": 2, "<class 'asyncio.exceptions.TimeoutError'>": 2}
{"total": 700, "avg_time_per_sample": "0:00:05.715770", "success": 579, "fail": 121, "<class '__main__.RateLimitError'>": 106, "<class '__main__.ContentFormatError'>": 11, "<class 'KeyError'>": 2, "<class 'asyncio.exceptions.TimeoutError'>": 2}
{"total": 800, "avg_time_per_sample": "0:00:05.688363", "success": 663, "fail": 137, "<class '__main__.RateLimitError'>": 122, "<class '__main__.ContentFormatError'>": 11, "<class 'KeyError'>": 2, "<class 'asyncio.exceptions.TimeoutError'>": 2}
{"total": 900, "avg_time_per_sample": "0:00:05.690999", "success": 746, "fail": 154, "<class '__main__.RateLimitError'>": 139, "<class '__main__.ContentFormatError'>": 11, "<class 'KeyError'>": 2, "<class 'asyncio.exceptions.TimeoutError'>": 2}
{"total": 1000, "avg_time_per_sample": "0:00:05.684739", "success": 834, "fail": 166, "<class '__main__.RateLimitError'>": 148, "<class '__main__.ContentFormatError'>": 14, "<class 'KeyError'>": 2, "<class 'asyncio.exceptions.TimeoutError'>": 2}
{"start_time": "2023-09-17 22:13:56", "temperature": 1.0, "top_p": 1.0, "check": true, "tool_graph": "graph_desc_multimedia.json", "tool_desc": "tools_desc_multimedia.json", "api_addr": "10.15.82.10", "api_port": 8002, "play": false, "method": null, "tool_number": null, "number_of_samples": 10000, "seed": 0, "output_dir": "result_20230917115415_tools_desc_multimedia_gpt-4_t1_0_p1_0_check", "save_figure": false, "multiworker": 10, "llm": "gpt-4"}
{"total": 100, "avg_time_per_sample": "0:00:05.263069", "success": 90, "fail": 10, "<class '__main__.RateLimitError'>": 9, "<class '__main__.ContentFormatError'>": 1}
{"total": 200, "avg_time_per_sample": "0:00:05.391122", "success": 177, "fail": 23, "<class '__main__.RateLimitError'>": 19, "<class '__main__.ContentFormatError'>": 2, "<class 'asyncio.exceptions.TimeoutError'>": 2}
{"total": 300, "avg_time_per_sample": "0:00:05.502713", "success": 260, "fail": 40, "<class '__main__.RateLimitError'>": 33, "<class '__main__.ContentFormatError'>": 4, "<class 'asyncio.exceptions.TimeoutError'>": 3}
{"total": 400, "avg_time_per_sample": "0:00:05.524784", "success": 346, "fail": 54, "<class '__main__.RateLimitError'>": 46, "<class '__main__.ContentFormatError'>": 5, "<class 'asyncio.exceptions.TimeoutError'>": 3}
{"total": 500, "avg_time_per_sample": "0:00:05.576193", "success": 431, "fail": 69, "<class '__main__.RateLimitError'>": 58, "<class '__main__.ContentFormatError'>": 8, "<class 'asyncio.exceptions.TimeoutError'>": 3}
{"total": 600, "avg_time_per_sample": "0:00:05.547943", "success": 520, "fail": 80, "<class '__main__.RateLimitError'>": 69, "<class '__main__.ContentFormatError'>": 8, "<class 'asyncio.exceptions.TimeoutError'>": 3}
{"total": 700, "avg_time_per_sample": "0:00:05.555535", "success": 603, "fail": 97, "<class '__main__.RateLimitError'>": 85, "<class '__main__.ContentFormatError'>": 9, "<class 'asyncio.exceptions.TimeoutError'>": 3}
{"total": 800, "avg_time_per_sample": "0:00:05.541672", "success": 687, "fail": 113, "<class '__main__.RateLimitError'>": 99, "<class '__main__.ContentFormatError'>": 11, "<class 'asyncio.exceptions.TimeoutError'>": 3}
{"total": 900, "avg_time_per_sample": "0:00:05.600364", "success": 769, "fail": 131, "<class '__main__.RateLimitError'>": 115, "<class '__main__.ContentFormatError'>": 12, "<class 'asyncio.exceptions.TimeoutError'>": 4}
{"total": 1000, "avg_time_per_sample": "0:00:05.626749", "success": 852, "fail": 148, "<class '__main__.RateLimitError'>": 128, "<class '__main__.ContentFormatError'>": 15, "<class 'asyncio.exceptions.TimeoutError'>": 5}
{"total": 1100, "avg_time_per_sample": "0:00:05.638367", "success": 940, "fail": 160, "<class '__main__.RateLimitError'>": 140, "<class '__main__.ContentFormatError'>": 15, "<class 'asyncio.exceptions.TimeoutError'>": 5}
{"total": 1200, "avg_time_per_sample": "0:00:05.628623", "success": 1028, "fail": 172, "<class '__main__.RateLimitError'>": 151, "<class '__main__.ContentFormatError'>": 16, "<class 'asyncio.exceptions.TimeoutError'>": 5}
{"total": 1300, "avg_time_per_sample": "0:00:05.637268", "success": 1119, "fail": 181, "<class '__main__.RateLimitError'>": 158, "<class '__main__.ContentFormatError'>": 17, "<class 'asyncio.exceptions.TimeoutError'>": 6}
{"total": 1400, "avg_time_per_sample": "0:00:05.696676", "success": 1206, "fail": 194, "<class '__main__.RateLimitError'>": 165, "<class '__main__.ContentFormatError'>": 18, "<class 'asyncio.exceptions.TimeoutError'>": 9, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2}
{"total": 1500, "avg_time_per_sample": "0:00:05.702345", "success": 1305, "fail": 195, "<class '__main__.RateLimitError'>": 166, "<class '__main__.ContentFormatError'>": 18, "<class 'asyncio.exceptions.TimeoutError'>": 9, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2}
{"total": 1600, "avg_time_per_sample": "0:00:05.948784", "success": 1374, "fail": 226, "<class '__main__.RateLimitError'>": 193, "<class '__main__.ContentFormatError'>": 20, "<class 'asyncio.exceptions.TimeoutError'>": 11, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2}
{"total": 1700, "avg_time_per_sample": "0:00:06.224618", "success": 1435, "fail": 265, "<class '__main__.RateLimitError'>": 228, "<class '__main__.ContentFormatError'>": 23, "<class 'asyncio.exceptions.TimeoutError'>": 12, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2}
{"total": 1800, "avg_time_per_sample": "0:00:06.400412", "success": 1515, "fail": 285, "<class '__main__.RateLimitError'>": 246, "<class '__main__.ContentFormatError'>": 23, "<class 'asyncio.exceptions.TimeoutError'>": 14, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2}
{"total": 1900, "avg_time_per_sample": "0:00:06.441017", "success": 1606, "fail": 294, "<class '__main__.RateLimitError'>": 253, "<class '__main__.ContentFormatError'>": 24, "<class 'asyncio.exceptions.TimeoutError'>": 14, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 1}
{"total": 2000, "avg_time_per_sample": "0:00:06.494757", "success": 1697, "fail": 303, "<class '__main__.RateLimitError'>": 261, "<class '__main__.ContentFormatError'>": 25, "<class 'asyncio.exceptions.TimeoutError'>": 14, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 1}
{"total": 2100, "avg_time_per_sample": "0:00:06.514965", "success": 1789, "fail": 311, "<class '__main__.RateLimitError'>": 269, "<class '__main__.ContentFormatError'>": 25, "<class 'asyncio.exceptions.TimeoutError'>": 14, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 1}
{"total": 2200, "avg_time_per_sample": "0:00:06.508107", "success": 1885, "fail": 315, "<class '__main__.RateLimitError'>": 272, "<class '__main__.ContentFormatError'>": 26, "<class 'asyncio.exceptions.TimeoutError'>": 14, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 1}
{"total": 2300, "avg_time_per_sample": "0:00:06.510685", "success": 1979, "fail": 321, "<class '__main__.RateLimitError'>": 277, "<class '__main__.ContentFormatError'>": 27, "<class 'asyncio.exceptions.TimeoutError'>": 14, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 1}
{"total": 2400, "avg_time_per_sample": "0:00:06.516235", "success": 2075, "fail": 325, "<class '__main__.RateLimitError'>": 280, "<class '__main__.ContentFormatError'>": 28, "<class 'asyncio.exceptions.TimeoutError'>": 14, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 1}
{"total": 2500, "avg_time_per_sample": "0:00:06.514734", "success": 2170, "fail": 330, "<class '__main__.RateLimitError'>": 284, "<class '__main__.ContentFormatError'>": 29, "<class 'asyncio.exceptions.TimeoutError'>": 14, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 1}
{"total": 2600, "avg_time_per_sample": "0:00:06.518818", "success": 2261, "fail": 339, "<class '__main__.RateLimitError'>": 288, "<class '__main__.ContentFormatError'>": 32, "<class 'asyncio.exceptions.TimeoutError'>": 15, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 2}
{"total": 2700, "avg_time_per_sample": "0:00:06.517663", "success": 2355, "fail": 345, "<class '__main__.RateLimitError'>": 292, "<class '__main__.ContentFormatError'>": 33, "<class 'asyncio.exceptions.TimeoutError'>": 16, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 2}
{"total": 2800, "avg_time_per_sample": "0:00:06.508798", "success": 2451, "fail": 349, "<class '__main__.RateLimitError'>": 294, "<class '__main__.ContentFormatError'>": 35, "<class 'asyncio.exceptions.TimeoutError'>": 16, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 2}
{"total": 2900, "avg_time_per_sample": "0:00:06.497314", "success": 2548, "fail": 352, "<class '__main__.RateLimitError'>": 295, "<class '__main__.ContentFormatError'>": 37, "<class 'asyncio.exceptions.TimeoutError'>": 16, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 2}
{"total": 3000, "avg_time_per_sample": "0:00:06.489737", "success": 2642, "fail": 358, "<class '__main__.RateLimitError'>": 300, "<class '__main__.ContentFormatError'>": 38, "<class 'asyncio.exceptions.TimeoutError'>": 16, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 2}
{"total": 3100, "avg_time_per_sample": "0:00:06.488468", "success": 2733, "fail": 367, "<class '__main__.RateLimitError'>": 307, "<class '__main__.ContentFormatError'>": 40, "<class 'asyncio.exceptions.TimeoutError'>": 16, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 2}
{"total": 3200, "avg_time_per_sample": "0:00:06.469462", "success": 2827, "fail": 373, "<class '__main__.RateLimitError'>": 312, "<class '__main__.ContentFormatError'>": 41, "<class 'asyncio.exceptions.TimeoutError'>": 16, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 2}
{"total": 3300, "avg_time_per_sample": "0:00:06.447103", "success": 2923, "fail": 377, "<class '__main__.RateLimitError'>": 314, "<class '__main__.ContentFormatError'>": 43, "<class 'asyncio.exceptions.TimeoutError'>": 16, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 2}
{"total": 3400, "avg_time_per_sample": "0:00:06.420805", "success": 3020, "fail": 380, "<class '__main__.RateLimitError'>": 316, "<class '__main__.ContentFormatError'>": 43, "<class 'asyncio.exceptions.TimeoutError'>": 17, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 2}
{"total": 3500, "avg_time_per_sample": "0:00:06.398359", "success": 3116, "fail": 384, "<class '__main__.RateLimitError'>": 319, "<class '__main__.ContentFormatError'>": 44, "<class 'asyncio.exceptions.TimeoutError'>": 17, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 2}
{"total": 3600, "avg_time_per_sample": "0:00:06.397480", "success": 3215, "fail": 385, "<class '__main__.RateLimitError'>": 319, "<class '__main__.ContentFormatError'>": 44, "<class 'asyncio.exceptions.TimeoutError'>": 18, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 2}
{"total": 3700, "avg_time_per_sample": "0:00:06.384353", "success": 3311, "fail": 389, "<class '__main__.RateLimitError'>": 321, "<class '__main__.ContentFormatError'>": 46, "<class 'asyncio.exceptions.TimeoutError'>": 18, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 2}
{"total": 3800, "avg_time_per_sample": "0:00:06.370665", "success": 3406, "fail": 394, "<class '__main__.RateLimitError'>": 323, "<class '__main__.ContentFormatError'>": 49, "<class 'asyncio.exceptions.TimeoutError'>": 18, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 2}
{"total": 3900, "avg_time_per_sample": "0:00:06.350501", "success": 3504, "fail": 396, "<class '__main__.RateLimitError'>": 324, "<class '__main__.ContentFormatError'>": 50, "<class 'asyncio.exceptions.TimeoutError'>": 18, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 2}
{"total": 4000, "avg_time_per_sample": "0:00:06.345627", "success": 3601, "fail": 399, "<class '__main__.RateLimitError'>": 327, "<class '__main__.ContentFormatError'>": 50, "<class 'asyncio.exceptions.TimeoutError'>": 18, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 2}
{"total": 4100, "avg_time_per_sample": "0:00:06.327470", "success": 3700, "fail": 400, "<class '__main__.RateLimitError'>": 328, "<class '__main__.ContentFormatError'>": 50, "<class 'asyncio.exceptions.TimeoutError'>": 18, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 2}
{"total": 4200, "avg_time_per_sample": "0:00:06.308712", "success": 3796, "fail": 404, "<class '__main__.RateLimitError'>": 330, "<class '__main__.ContentFormatError'>": 52, "<class 'asyncio.exceptions.TimeoutError'>": 18, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 2}
{"total": 4300, "avg_time_per_sample": "0:00:06.306838", "success": 3893, "fail": 407, "<class '__main__.RateLimitError'>": 332, "<class '__main__.ContentFormatError'>": 53, "<class 'asyncio.exceptions.TimeoutError'>": 18, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 2, "<class 'KeyError'>": 2}
{"temperature": 1.0, "top_p": 1.0, "check": true, "tool_graph": "graph_desc_multimedia.json", "tool_desc": "tools_desc_multimedia.json", "api_addr": "10.15.82.10", "api_port": 8002, "play": false, "method": null, "tool_number": null, "number_of_samples": 5000, "seed": -1, "output_dir": "result_20230917115415_tools_desc_multimedia_gpt-4_t1_0_p1_0_check", "save_figure": false, "multiworker": 3, "llm": "gpt-4", "use_async": true, "ignore_tool_type": false, "start_time": "2023-09-18 05:11:56"}
{"total": 100, "avg_time_per_sample": "0:00:18.492466", "success": 98, "fail": 2, "<class '__main__.ContentFormatError'>": 1, "<class '__main__.RateLimitError'>": 1}
{"temperature": 1.0, "top_p": 1.0, "check": true, "tool_graph": "graph_desc_multimedia.json", "tool_desc": "tools_desc_multimedia.json", "api_addr": "10.15.82.10", "api_port": 8002, "play": false, "method": null, "tool_number": null, "number_of_samples": 5000, "seed": -1, "output_dir": "result_20230917115415_tools_desc_multimedia_gpt-4_t1_0_p1_0_check", "save_figure": false, "multiworker": 3, "llm": "gpt-4", "use_async": true, "ignore_tool_type": false, "start_time": "2023-09-18 10:44:47"}
{"total": 100, "avg_time_per_sample": "0:00:25.773789", "success": 98, "fail": 2, "<class '__main__.ContentFormatError'>": 2}
{"total": 200, "avg_time_per_sample": "0:00:25.460098", "success": 195, "fail": 5, "<class '__main__.ContentFormatError'>": 4, "<class 'asyncio.exceptions.TimeoutError'>": 1}
{"total": 300, "avg_time_per_sample": "0:00:27.356164", "success": 286, "fail": 14, "<class '__main__.ContentFormatError'>": 5, "<class 'asyncio.exceptions.TimeoutError'>": 6, "<class '__main__.RateLimitError'>": 3}
{"total": 400, "avg_time_per_sample": "0:00:29.125220", "success": 373, "fail": 27, "<class '__main__.ContentFormatError'>": 6, "<class 'asyncio.exceptions.TimeoutError'>": 16, "<class '__main__.RateLimitError'>": 5}
{"total": 500, "avg_time_per_sample": "0:00:30.997040", "success": 453, "fail": 47, "<class '__main__.ContentFormatError'>": 6, "<class 'asyncio.exceptions.TimeoutError'>": 31, "<class '__main__.RateLimitError'>": 10}
{"total": 600, "avg_time_per_sample": "0:00:32.875587", "success": 526, "fail": 74, "<class '__main__.ContentFormatError'>": 6, "<class 'asyncio.exceptions.TimeoutError'>": 54, "<class '__main__.RateLimitError'>": 13, "<class 'KeyError'>": 1}
{"total": 700, "avg_time_per_sample": "0:00:34.133398", "success": 602, "fail": 98, "<class '__main__.ContentFormatError'>": 7, "<class 'asyncio.exceptions.TimeoutError'>": 77, "<class '__main__.RateLimitError'>": 13, "<class 'KeyError'>": 1}
{"total": 800, "avg_time_per_sample": "0:00:34.075003", "success": 689, "fail": 111, "<class '__main__.ContentFormatError'>": 7, "<class 'asyncio.exceptions.TimeoutError'>": 87, "<class '__main__.RateLimitError'>": 16, "<class 'KeyError'>": 1}
{"total": 900, "avg_time_per_sample": "0:00:31.379992", "success": 787, "fail": 113, "<class '__main__.ContentFormatError'>": 9, "<class 'asyncio.exceptions.TimeoutError'>": 87, "<class '__main__.RateLimitError'>": 16, "<class 'KeyError'>": 1}
{"total": 1000, "avg_time_per_sample": "0:00:29.273185", "success": 886, "fail": 114, "<class '__main__.ContentFormatError'>": 10, "<class 'asyncio.exceptions.TimeoutError'>": 87, "<class '__main__.RateLimitError'>": 16, "<class 'KeyError'>": 1}
{"total": 1100, "avg_time_per_sample": "0:00:27.558860", "success": 985, "fail": 115, "<class '__main__.ContentFormatError'>": 11, "<class 'asyncio.exceptions.TimeoutError'>": 87, "<class '__main__.RateLimitError'>": 16, "<class 'KeyError'>": 1}
{"total": 1200, "avg_time_per_sample": "0:00:26.108732", "success": 1085, "fail": 115, "<class '__main__.ContentFormatError'>": 11, "<class 'asyncio.exceptions.TimeoutError'>": 87, "<class '__main__.RateLimitError'>": 16, "<class 'KeyError'>": 1}
{"total": 1300, "avg_time_per_sample": "0:00:24.991776", "success": 1183, "fail": 117, "<class '__main__.ContentFormatError'>": 13, "<class 'asyncio.exceptions.TimeoutError'>": 87, "<class '__main__.RateLimitError'>": 16, "<class 'KeyError'>": 1}
{"total": 1400, "avg_time_per_sample": "0:00:24.038322", "success": 1280, "fail": 120, "<class '__main__.ContentFormatError'>": 16, "<class 'asyncio.exceptions.TimeoutError'>": 87, "<class '__main__.RateLimitError'>": 16, "<class 'KeyError'>": 1}
{"total": 1500, "avg_time_per_sample": "0:00:23.228270", "success": 1379, "fail": 121, "<class '__main__.ContentFormatError'>": 17, "<class 'asyncio.exceptions.TimeoutError'>": 87, "<class '__main__.RateLimitError'>": 16, "<class 'KeyError'>": 1}
{"total": 1600, "avg_time_per_sample": "0:00:24.956090", "success": 1411, "fail": 189, "<class '__main__.ContentFormatError'>": 17, "<class 'asyncio.exceptions.TimeoutError'>": 155, "<class '__main__.RateLimitError'>": 16, "<class 'KeyError'>": 1}
{"total": 1700, "avg_time_per_sample": "0:00:27.179748", "success": 1419, "fail": 281, "<class '__main__.ContentFormatError'>": 17, "<class 'asyncio.exceptions.TimeoutError'>": 247, "<class '__main__.RateLimitError'>": 16, "<class 'KeyError'>": 1}
{"temperature": 1.0, "top_p": 1.0, "check": true, "tool_graph": "graph_desc_multimedia.json", "tool_desc": "tools_desc_multimedia.json", "api_addr": "10.15.82.10", "api_port": 8002, "play": false, "method": null, "tool_number": null, "number_of_samples": 7000, "seed": -1, "output_dir": "result_20230917115415_tools_desc_multimedia_gpt-4_t1_0_p1_0_check", "save_figure": false, "multiworker": 2, "llm": "gpt-4", "use_async": true, "ignore_tool_type": false, "start_time": "2023-09-19 00:46:57"}
{"total": 100, "avg_time_per_sample": "0:00:27.115795", "success": 89, "fail": 11, "<class '__main__.RateLimitError'>": 9, "<class '__main__.ContentFormatError'>": 2}
{"total": 200, "avg_time_per_sample": "0:00:28.578145", "success": 172, "fail": 28, "<class '__main__.RateLimitError'>": 25, "<class '__main__.ContentFormatError'>": 2, "<class 'KeyError'>": 1}
{"total": 300, "avg_time_per_sample": "0:00:30.734945", "success": 248, "fail": 52, "<class '__main__.RateLimitError'>": 46, "<class '__main__.ContentFormatError'>": 4, "<class 'KeyError'>": 2}
{"total": 400, "avg_time_per_sample": "0:00:32.058337", "success": 328, "fail": 72, "<class '__main__.RateLimitError'>": 65, "<class '__main__.ContentFormatError'>": 5, "<class 'KeyError'>": 2}
{"total": 500, "avg_time_per_sample": "0:00:34.162180", "success": 389, "fail": 111, "<class '__main__.RateLimitError'>": 103, "<class '__main__.ContentFormatError'>": 6, "<class 'KeyError'>": 2}
{"total": 600, "avg_time_per_sample": "0:00:34.371316", "success": 470, "fail": 130, "<class '__main__.RateLimitError'>": 121, "<class '__main__.ContentFormatError'>": 7, "<class 'KeyError'>": 2}
{"total": 700, "avg_time_per_sample": "0:00:34.516555", "success": 548, "fail": 152, "<class '__main__.RateLimitError'>": 141, "<class '__main__.ContentFormatError'>": 9, "<class 'KeyError'>": 2}
{"total": 800, "avg_time_per_sample": "0:00:34.119824", "success": 633, "fail": 167, "<class '__main__.RateLimitError'>": 156, "<class '__main__.ContentFormatError'>": 9, "<class 'KeyError'>": 2}
{"total": 900, "avg_time_per_sample": "0:00:34.458678", "success": 709, "fail": 191, "<class '__main__.RateLimitError'>": 179, "<class '__main__.ContentFormatError'>": 10, "<class 'KeyError'>": 2}
{"total": 1000, "avg_time_per_sample": "0:00:34.327870", "success": 788, "fail": 212, "<class '__main__.RateLimitError'>": 200, "<class '__main__.ContentFormatError'>": 10, "<class 'KeyError'>": 2}
{"total": 1100, "avg_time_per_sample": "0:00:34.491414", "success": 865, "fail": 235, "<class '__main__.RateLimitError'>": 222, "<class '__main__.ContentFormatError'>": 11, "<class 'KeyError'>": 2}
{"total": 1200, "avg_time_per_sample": "0:00:34.956720", "success": 932, "fail": 268, "<class '__main__.RateLimitError'>": 255, "<class '__main__.ContentFormatError'>": 11, "<class 'KeyError'>": 2}
{"total": 1300, "avg_time_per_sample": "0:00:35.253649", "success": 1004, "fail": 296, "<class '__main__.RateLimitError'>": 282, "<class '__main__.ContentFormatError'>": 12, "<class 'KeyError'>": 2}
{"total": 1400, "avg_time_per_sample": "0:00:36.827351", "success": 1047, "fail": 353, "<class '__main__.RateLimitError'>": 336, "<class '__main__.ContentFormatError'>": 13, "<class 'KeyError'>": 2, "<class 'asyncio.exceptions.TimeoutError'>": 2}
{"total": 1500, "avg_time_per_sample": "0:00:38.339434", "success": 1087, "fail": 413, "<class '__main__.RateLimitError'>": 394, "<class '__main__.ContentFormatError'>": 15, "<class 'KeyError'>": 2, "<class 'asyncio.exceptions.TimeoutError'>": 2}
{"total": 1600, "avg_time_per_sample": "0:00:39.832710", "success": 1124, "fail": 476, "<class '__main__.RateLimitError'>": 457, "<class '__main__.ContentFormatError'>": 15, "<class 'KeyError'>": 2, "<class 'asyncio.exceptions.TimeoutError'>": 2}
