{"start_time": "2023-09-18 04:53:36", "temperature": 1.0, "top_p": 1.0, "check": true, "tool_graph": "graph_desc_apis.json", "tool_desc": "tools_desc_apis.json", "api_addr": "10.15.82.10", "api_port": 8002, "play": false, "method": null, "tool_number": null, "number_of_samples": 100, "seed": 0, "output_dir": "result_20230918045336_tools_desc_apis_gpt-4_t1_0_p1_0_check", "save_figure": false, "multiworker": 1, "llm": "gpt-4"}
{"temperature": 1.0, "top_p": 1.0, "check": true, "tool_graph": "graph_desc_apis.json", "tool_desc": "tools_desc_apis.json", "api_addr": "10.15.82.10", "api_port": 8002, "play": false, "method": null, "tool_number": null, "number_of_samples": 100, "seed": -1, "output_dir": "result_20230918045336_tools_desc_apis_gpt-4_t1_0_p1_0_check", "save_figure": false, "multiworker": 1, "llm": "gpt-4", "use_async": true, "ignore_tool_type": true, "start_time": "2023-09-18 05:04:14"}
{"temperature": 1.0, "top_p": 1.0, "check": true, "tool_graph": "graph_desc_apis.json", "tool_desc": "tools_desc_apis.json", "api_addr": "10.15.82.10", "api_port": 8002, "play": false, "method": null, "tool_number": null, "number_of_samples": 10, "seed": -1, "output_dir": "result_20230918045336_tools_desc_apis_gpt-4_t1_0_p1_0_check", "save_figure": false, "multiworker": 1, "llm": "gpt-4", "use_async": false, "ignore_tool_type": true, "start_time": "2023-09-18 05:04:28"}
{"temperature": 1.0, "top_p": 1.0, "check": true, "tool_graph": "graph_desc_apis.json", "tool_desc": "tools_desc_apis.json", "api_addr": "10.15.82.10", "api_port": 8002, "play": false, "method": null, "tool_number": null, "number_of_samples": 5000, "seed": -1, "output_dir": "result_20230918045336_tools_desc_apis_gpt-4_t1_0_p1_0_check", "save_figure": false, "multiworker": 8, "llm": "gpt-4", "use_async": true, "ignore_tool_type": true, "start_time": "2023-09-18 05:13:54"}
{"total": 100, "avg_time_per_sample": "0:00:08.207549", "success": 97, "fail": 3, "<class '__main__.ContentFormatError'>": 2, "<class '__main__.RateLimitError'>": 1}
{"total": 200, "avg_time_per_sample": "0:00:08.320668", "success": 194, "fail": 6, "<class '__main__.ContentFormatError'>": 3, "<class '__main__.RateLimitError'>": 3}
{"total": 300, "avg_time_per_sample": "0:00:07.902064", "success": 288, "fail": 12, "<class '__main__.ContentFormatError'>": 8, "<class '__main__.RateLimitError'>": 4}
{"total": 400, "avg_time_per_sample": "0:00:07.491399", "success": 383, "fail": 17, "<class '__main__.ContentFormatError'>": 12, "<class '__main__.RateLimitError'>": 5}
{"total": 500, "avg_time_per_sample": "0:00:07.259123", "success": 479, "fail": 21, "<class '__main__.ContentFormatError'>": 16, "<class '__main__.RateLimitError'>": 5}
{"total": 600, "avg_time_per_sample": "0:00:07.036882", "success": 578, "fail": 22, "<class '__main__.ContentFormatError'>": 17, "<class '__main__.RateLimitError'>": 5}
{"total": 700, "avg_time_per_sample": "0:00:06.949604", "success": 675, "fail": 25, "<class '__main__.ContentFormatError'>": 20, "<class '__main__.RateLimitError'>": 5}
{"total": 800, "avg_time_per_sample": "0:00:06.891096", "success": 774, "fail": 26, "<class '__main__.ContentFormatError'>": 21, "<class '__main__.RateLimitError'>": 5}
{"total": 900, "avg_time_per_sample": "0:00:06.851390", "success": 872, "fail": 28, "<class '__main__.ContentFormatError'>": 23, "<class '__main__.RateLimitError'>": 5}
{"total": 1000, "avg_time_per_sample": "0:00:06.825729", "success": 969, "fail": 31, "<class '__main__.ContentFormatError'>": 25, "<class '__main__.RateLimitError'>": 6}
{"total": 1100, "avg_time_per_sample": "0:00:06.783878", "success": 1066, "fail": 34, "<class '__main__.ContentFormatError'>": 28, "<class '__main__.RateLimitError'>": 6}
{"total": 1200, "avg_time_per_sample": "0:00:06.740813", "success": 1163, "fail": 37, "<class '__main__.ContentFormatError'>": 30, "<class '__main__.RateLimitError'>": 7}
{"total": 1300, "avg_time_per_sample": "0:00:06.711025", "success": 1262, "fail": 38, "<class '__main__.ContentFormatError'>": 31, "<class '__main__.RateLimitError'>": 7}
{"total": 1400, "avg_time_per_sample": "0:00:06.719584", "success": 1360, "fail": 40, "<class '__main__.ContentFormatError'>": 33, "<class '__main__.RateLimitError'>": 7}
{"total": 1500, "avg_time_per_sample": "0:00:06.691437", "success": 1459, "fail": 41, "<class '__main__.ContentFormatError'>": 34, "<class '__main__.RateLimitError'>": 7}
{"total": 1600, "avg_time_per_sample": "0:00:06.690764", "success": 1556, "fail": 44, "<class '__main__.ContentFormatError'>": 37, "<class '__main__.RateLimitError'>": 7}
{"total": 1700, "avg_time_per_sample": "0:00:06.686329", "success": 1654, "fail": 46, "<class '__main__.ContentFormatError'>": 39, "<class '__main__.RateLimitError'>": 7}
{"total": 1800, "avg_time_per_sample": "0:00:06.665371", "success": 1753, "fail": 47, "<class '__main__.ContentFormatError'>": 40, "<class '__main__.RateLimitError'>": 7}
{"total": 1900, "avg_time_per_sample": "0:00:06.632352", "success": 1851, "fail": 49, "<class '__main__.ContentFormatError'>": 42, "<class '__main__.RateLimitError'>": 7}
{"total": 2000, "avg_time_per_sample": "0:00:06.605534", "success": 1950, "fail": 50, "<class '__main__.ContentFormatError'>": 43, "<class '__main__.RateLimitError'>": 7}
{"total": 2100, "avg_time_per_sample": "0:00:06.584712", "success": 2048, "fail": 52, "<class '__main__.ContentFormatError'>": 44, "<class '__main__.RateLimitError'>": 8}
{"total": 2200, "avg_time_per_sample": "0:00:06.566294", "success": 2146, "fail": 54, "<class '__main__.ContentFormatError'>": 46, "<class '__main__.RateLimitError'>": 8}
{"total": 2300, "avg_time_per_sample": "0:00:06.538969", "success": 2244, "fail": 56, "<class '__main__.ContentFormatError'>": 48, "<class '__main__.RateLimitError'>": 8}
{"total": 2400, "avg_time_per_sample": "0:00:06.531883", "success": 2343, "fail": 57, "<class '__main__.ContentFormatError'>": 48, "<class '__main__.RateLimitError'>": 8, "<class 'KeyError'>": 1}
{"total": 2500, "avg_time_per_sample": "0:00:06.516551", "success": 2440, "fail": 60, "<class '__main__.ContentFormatError'>": 48, "<class '__main__.RateLimitError'>": 8, "<class 'KeyError'>": 2, "<class 'asyncio.exceptions.TimeoutError'>": 2}
{"total": 2600, "avg_time_per_sample": "0:00:06.510111", "success": 2539, "fail": 61, "<class '__main__.ContentFormatError'>": 48, "<class '__main__.RateLimitError'>": 8, "<class 'KeyError'>": 2, "<class 'asyncio.exceptions.TimeoutError'>": 3}
{"total": 2700, "avg_time_per_sample": "0:00:06.552576", "success": 2633, "fail": 67, "<class '__main__.ContentFormatError'>": 52, "<class '__main__.RateLimitError'>": 9, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 3}
{"total": 2800, "avg_time_per_sample": "0:00:06.607366", "success": 2733, "fail": 67, "<class '__main__.ContentFormatError'>": 52, "<class '__main__.RateLimitError'>": 9, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 3}
{"total": 2900, "avg_time_per_sample": "0:00:06.658762", "success": 2833, "fail": 67, "<class '__main__.ContentFormatError'>": 52, "<class '__main__.RateLimitError'>": 9, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 3}
{"total": 3000, "avg_time_per_sample": "0:00:06.698204", "success": 2931, "fail": 69, "<class '__main__.ContentFormatError'>": 53, "<class '__main__.RateLimitError'>": 9, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 4}
{"total": 3100, "avg_time_per_sample": "0:00:06.835559", "success": 3026, "fail": 74, "<class '__main__.ContentFormatError'>": 53, "<class '__main__.RateLimitError'>": 9, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 9}
{"total": 3200, "avg_time_per_sample": "0:00:06.929762", "success": 3122, "fail": 78, "<class '__main__.ContentFormatError'>": 56, "<class '__main__.RateLimitError'>": 9, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 10}
{"total": 3300, "avg_time_per_sample": "0:00:07.035037", "success": 3220, "fail": 80, "<class '__main__.ContentFormatError'>": 57, "<class '__main__.RateLimitError'>": 9, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 11}
{"total": 3400, "avg_time_per_sample": "0:00:07.143802", "success": 3315, "fail": 85, "<class '__main__.ContentFormatError'>": 58, "<class '__main__.RateLimitError'>": 9, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 15}
{"total": 3500, "avg_time_per_sample": "0:00:07.220711", "success": 3413, "fail": 87, "<class '__main__.ContentFormatError'>": 59, "<class '__main__.RateLimitError'>": 9, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 16}
{"total": 3600, "avg_time_per_sample": "0:00:07.346786", "success": 3503, "fail": 97, "<class '__main__.ContentFormatError'>": 60, "<class '__main__.RateLimitError'>": 11, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 23}
{"total": 3700, "avg_time_per_sample": "0:00:07.463077", "success": 3594, "fail": 106, "<class '__main__.ContentFormatError'>": 61, "<class '__main__.RateLimitError'>": 12, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 30}
{"total": 3800, "avg_time_per_sample": "0:00:07.603695", "success": 3678, "fail": 122, "<class '__main__.ContentFormatError'>": 62, "<class '__main__.RateLimitError'>": 15, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 42}
{"total": 3900, "avg_time_per_sample": "0:00:07.772831", "success": 3751, "fail": 149, "<class '__main__.ContentFormatError'>": 65, "<class '__main__.RateLimitError'>": 19, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 62}
{"total": 4000, "avg_time_per_sample": "0:00:07.911649", "success": 3834, "fail": 166, "<class '__main__.ContentFormatError'>": 67, "<class '__main__.RateLimitError'>": 23, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 73}
{"total": 4100, "avg_time_per_sample": "0:00:08.041495", "success": 3916, "fail": 184, "<class '__main__.ContentFormatError'>": 68, "<class '__main__.RateLimitError'>": 25, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 88}
{"total": 4200, "avg_time_per_sample": "0:00:08.242647", "success": 3981, "fail": 219, "<class '__main__.ContentFormatError'>": 70, "<class '__main__.RateLimitError'>": 30, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 116}
{"total": 4300, "avg_time_per_sample": "0:00:08.424216", "success": 4046, "fail": 254, "<class '__main__.ContentFormatError'>": 72, "<class '__main__.RateLimitError'>": 35, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 144}
{"total": 4400, "avg_time_per_sample": "0:00:08.605306", "success": 4112, "fail": 288, "<class '__main__.ContentFormatError'>": 74, "<class '__main__.RateLimitError'>": 38, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 173}
{"total": 4500, "avg_time_per_sample": "0:00:08.744408", "success": 4184, "fail": 316, "<class '__main__.ContentFormatError'>": 76, "<class '__main__.RateLimitError'>": 41, "<class 'KeyError'>": 3, "<class 'asyncio.exceptions.TimeoutError'>": 196}
{"total": 4600, "avg_time_per_sample": "0:00:08.942568", "success": 4240, "fail": 360, "<class '__main__.ContentFormatError'>": 77, "<class '__main__.RateLimitError'>": 43, "<class 'KeyError'>": 4, "<class 'asyncio.exceptions.TimeoutError'>": 236}
{"total": 4700, "avg_time_per_sample": "0:00:09.079665", "success": 4316, "fail": 384, "<class '__main__.ContentFormatError'>": 78, "<class '__main__.RateLimitError'>": 43, "<class 'KeyError'>": 5, "<class 'asyncio.exceptions.TimeoutError'>": 258}
{"total": 4800, "avg_time_per_sample": "0:00:09.200383", "success": 4392, "fail": 408, "<class '__main__.ContentFormatError'>": 79, "<class '__main__.RateLimitError'>": 46, "<class 'KeyError'>": 5, "<class 'asyncio.exceptions.TimeoutError'>": 278}
{"total": 4900, "avg_time_per_sample": "0:00:09.394517", "success": 4448, "fail": 452, "<class '__main__.ContentFormatError'>": 81, "<class '__main__.RateLimitError'>": 47, "<class 'KeyError'>": 5, "<class 'asyncio.exceptions.TimeoutError'>": 318, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 1}
{"total": 5000, "avg_time_per_sample": "0:00:09.531990", "success": 4518, "fail": 482, "<class '__main__.ContentFormatError'>": 82, "<class '__main__.RateLimitError'>": 48, "<class 'KeyError'>": 5, "<class 'asyncio.exceptions.TimeoutError'>": 346, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 1}
{"temperature": 1.0, "top_p": 1.0, "check": true, "tool_graph": "graph_desc_apis.json", "tool_desc": "tools_desc_apis.json", "api_addr": "10.15.82.10", "api_port": 8002, "play": false, "method": null, "tool_number": null, "number_of_samples": 7000, "seed": -1, "output_dir": "result_20230918045336_tools_desc_apis_gpt-4_t1_0_p1_0_check", "save_figure": false, "multiworker": 10, "llm": "gpt-4", "use_async": true, "ignore_tool_type": true, "start_time": "2023-09-18 19:40:34"}
{"total": 100, "avg_time_per_sample": "0:00:34.357445", "success": 34, "fail": 66, "<class 'asyncio.exceptions.TimeoutError'>": 66}
{"total": 200, "avg_time_per_sample": "0:00:48.121701", "success": 49, "fail": 151, "<class 'asyncio.exceptions.TimeoutError'>": 151}
{"total": 300, "avg_time_per_sample": "0:00:45.183257", "success": 73, "fail": 227, "<class 'asyncio.exceptions.TimeoutError'>": 226, "<class '__main__.ContentFormatError'>": 1}
{"total": 400, "avg_time_per_sample": "0:00:45.183257", "success": 73, "fail": 327, "<class 'asyncio.exceptions.TimeoutError'>": 326, "<class '__main__.ContentFormatError'>": 1}
{"total": 500, "avg_time_per_sample": "0:01:02.538147", "success": 85, "fail": 415, "<class 'asyncio.exceptions.TimeoutError'>": 413, "<class '__main__.ContentFormatError'>": 1, "<class '__main__.RateLimitError'>": 1}
{"total": 600, "avg_time_per_sample": "0:01:08.502710", "success": 94, "fail": 506, "<class 'asyncio.exceptions.TimeoutError'>": 504, "<class '__main__.ContentFormatError'>": 1, "<class '__main__.RateLimitError'>": 1}
{"total": 700, "avg_time_per_sample": "0:01:08.502710", "success": 94, "fail": 606, "<class 'asyncio.exceptions.TimeoutError'>": 604, "<class '__main__.ContentFormatError'>": 1, "<class '__main__.RateLimitError'>": 1}
{"total": 800, "avg_time_per_sample": "0:01:08.502710", "success": 94, "fail": 706, "<class 'asyncio.exceptions.TimeoutError'>": 704, "<class '__main__.ContentFormatError'>": 1, "<class '__main__.RateLimitError'>": 1}
{"total": 900, "avg_time_per_sample": "0:01:08.502710", "success": 94, "fail": 806, "<class 'asyncio.exceptions.TimeoutError'>": 804, "<class '__main__.ContentFormatError'>": 1, "<class '__main__.RateLimitError'>": 1}
{"total": 1000, "avg_time_per_sample": "0:01:08.502710", "success": 94, "fail": 906, "<class 'asyncio.exceptions.TimeoutError'>": 904, "<class '__main__.ContentFormatError'>": 1, "<class '__main__.RateLimitError'>": 1}
{"total": 1100, "avg_time_per_sample": "0:01:08.502710", "success": 94, "fail": 1006, "<class 'asyncio.exceptions.TimeoutError'>": 1004, "<class '__main__.ContentFormatError'>": 1, "<class '__main__.RateLimitError'>": 1}
{"total": 1200, "avg_time_per_sample": "0:01:08.502710", "success": 94, "fail": 1106, "<class 'asyncio.exceptions.TimeoutError'>": 1104, "<class '__main__.ContentFormatError'>": 1, "<class '__main__.RateLimitError'>": 1}
{"temperature": 1.0, "top_p": 1.0, "check": true, "tool_graph": "graph_desc_apis.json", "tool_desc": "tools_desc_apis.json", "api_addr": "10.15.82.10", "api_port": 8002, "play": false, "method": null, "tool_number": null, "number_of_samples": 7000, "seed": -1, "output_dir": "result_20230918045336_tools_desc_apis_gpt-4_t1_0_p1_0_check", "save_figure": false, "multiworker": 10, "llm": "gpt-4", "use_async": true, "ignore_tool_type": true, "start_time": "2023-09-19 00:00:45"}
{"temperature": 1.0, "top_p": 1.0, "check": true, "tool_graph": "graph_desc_apis.json", "tool_desc": "tools_desc_apis.json", "api_addr": "10.15.82.10", "api_port": 8002, "play": false, "method": null, "tool_number": null, "number_of_samples": 7000, "seed": -1, "output_dir": "result_20230918045336_tools_desc_apis_gpt-4_t1_0_p1_0_check", "save_figure": false, "multiworker": 1, "llm": "gpt-4", "use_async": true, "ignore_tool_type": true, "start_time": "2023-09-19 00:16:06"}
{"temperature": 1.0, "top_p": 1.0, "check": true, "tool_graph": "graph_desc_apis.json", "tool_desc": "tools_desc_apis.json", "api_addr": "10.15.82.10", "api_port": 8002, "play": false, "method": null, "tool_number": null, "number_of_samples": 7000, "seed": -1, "output_dir": "result_20230918045336_tools_desc_apis_gpt-4_t1_0_p1_0_check", "save_figure": false, "multiworker": 1, "llm": "gpt-4", "use_async": true, "ignore_tool_type": true, "start_time": "2023-09-19 00:27:14"}
{"total": 100, "avg_time_per_sample": 0, "success": 0, "fail": 100, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 92}
{"total": 200, "avg_time_per_sample": 0, "success": 0, "fail": 200, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 192}
{"total": 300, "avg_time_per_sample": 0, "success": 0, "fail": 300, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 292}
{"total": 400, "avg_time_per_sample": 0, "success": 0, "fail": 400, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 392}
{"total": 500, "avg_time_per_sample": 0, "success": 0, "fail": 500, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 492}
{"total": 600, "avg_time_per_sample": 0, "success": 0, "fail": 600, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 592}
{"total": 700, "avg_time_per_sample": 0, "success": 0, "fail": 700, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 692}
{"total": 800, "avg_time_per_sample": 0, "success": 0, "fail": 800, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 792}
{"total": 900, "avg_time_per_sample": 0, "success": 0, "fail": 900, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 892}
{"total": 1000, "avg_time_per_sample": 0, "success": 0, "fail": 1000, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 992}
{"total": 1100, "avg_time_per_sample": 0, "success": 0, "fail": 1100, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 1092}
{"total": 1200, "avg_time_per_sample": 0, "success": 0, "fail": 1200, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 1192}
{"total": 1300, "avg_time_per_sample": 0, "success": 0, "fail": 1300, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 1292}
{"total": 1400, "avg_time_per_sample": 0, "success": 0, "fail": 1400, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 1392}
{"total": 1500, "avg_time_per_sample": 0, "success": 0, "fail": 1500, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 1492}
{"total": 1600, "avg_time_per_sample": 0, "success": 0, "fail": 1600, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 1592}
{"total": 1700, "avg_time_per_sample": 0, "success": 0, "fail": 1700, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 1692}
{"total": 1800, "avg_time_per_sample": 0, "success": 0, "fail": 1800, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 1792}
{"total": 1900, "avg_time_per_sample": 0, "success": 0, "fail": 1900, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 1892}
{"total": 2000, "avg_time_per_sample": 0, "success": 0, "fail": 2000, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 1992}
{"total": 2100, "avg_time_per_sample": 0, "success": 0, "fail": 2100, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 2092}
{"total": 2200, "avg_time_per_sample": 0, "success": 0, "fail": 2200, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 2192}
{"total": 2300, "avg_time_per_sample": 0, "success": 0, "fail": 2300, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 2292}
{"total": 2400, "avg_time_per_sample": 0, "success": 0, "fail": 2400, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 2392}
{"total": 2500, "avg_time_per_sample": 0, "success": 0, "fail": 2500, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 2492}
{"total": 2600, "avg_time_per_sample": 0, "success": 0, "fail": 2600, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 2592}
{"total": 2700, "avg_time_per_sample": 0, "success": 0, "fail": 2700, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 2692}
{"total": 2800, "avg_time_per_sample": 0, "success": 0, "fail": 2800, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 2792}
{"total": 2900, "avg_time_per_sample": 0, "success": 0, "fail": 2900, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 2892}
{"total": 3000, "avg_time_per_sample": 0, "success": 0, "fail": 3000, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 2992}
{"total": 3100, "avg_time_per_sample": 0, "success": 0, "fail": 3100, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 3092}
{"total": 3200, "avg_time_per_sample": 0, "success": 0, "fail": 3200, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 3192}
{"total": 3300, "avg_time_per_sample": 0, "success": 0, "fail": 3300, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 3292}
{"total": 3400, "avg_time_per_sample": 0, "success": 0, "fail": 3400, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 3392}
{"total": 3500, "avg_time_per_sample": 0, "success": 0, "fail": 3500, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 3492}
{"total": 3600, "avg_time_per_sample": 0, "success": 0, "fail": 3600, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 3592}
{"total": 3700, "avg_time_per_sample": 0, "success": 0, "fail": 3700, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 3692}
{"total": 3800, "avg_time_per_sample": 0, "success": 0, "fail": 3800, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 3792}
{"total": 3900, "avg_time_per_sample": 0, "success": 0, "fail": 3900, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 3892}
{"total": 4000, "avg_time_per_sample": 0, "success": 0, "fail": 4000, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 3992}
{"total": 4100, "avg_time_per_sample": 0, "success": 0, "fail": 4100, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 4092}
{"total": 4200, "avg_time_per_sample": 0, "success": 0, "fail": 4200, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 4192}
{"total": 4300, "avg_time_per_sample": 0, "success": 0, "fail": 4300, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 4292}
{"total": 4400, "avg_time_per_sample": 0, "success": 0, "fail": 4400, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 4392}
{"total": 4500, "avg_time_per_sample": 0, "success": 0, "fail": 4500, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 4492}
{"total": 4600, "avg_time_per_sample": 0, "success": 0, "fail": 4600, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 4592}
{"total": 4700, "avg_time_per_sample": 0, "success": 0, "fail": 4700, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 4692}
{"total": 4800, "avg_time_per_sample": 0, "success": 0, "fail": 4800, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'aiohttp.client_exceptions.ServerDisconnectedError'>": 1, "<class 'aiohttp.client_exceptions.ClientConnectorError'>": 4792}
{"temperature": 1.0, "top_p": 1.0, "check": true, "tool_graph": "graph_desc_apis.json", "tool_desc": "tools_desc_apis.json", "api_addr": "10.15.82.10", "api_port": 8002, "play": false, "method": null, "tool_number": null, "number_of_samples": 7000, "seed": -1, "output_dir": "result_20230918045336_tools_desc_apis_gpt-4_t1_0_p1_0_check", "save_figure": false, "multiworker": 1, "llm": "gpt-4", "use_async": true, "ignore_tool_type": true, "start_time": "2023-09-19 00:43:34"}
{"temperature": 1.0, "top_p": 1.0, "check": true, "tool_graph": "graph_desc_apis.json", "tool_desc": "tools_desc_apis.json", "api_addr": "10.15.82.10", "api_port": 8002, "play": false, "method": null, "tool_number": null, "number_of_samples": 7000, "seed": -1, "output_dir": "result_20230918045336_tools_desc_apis_gpt-4_t1_0_p1_0_check", "save_figure": false, "multiworker": 5, "llm": "gpt-4", "use_async": true, "ignore_tool_type": true, "start_time": "2023-09-19 00:44:56"}
{"total": 100, "avg_time_per_sample": "0:00:10.411061", "success": 95, "fail": 5, "<class '__main__.ContentFormatError'>": 1, "<class '__main__.RateLimitError'>": 4}
{"total": 200, "avg_time_per_sample": "0:00:12.987285", "success": 169, "fail": 31, "<class '__main__.ContentFormatError'>": 1, "<class '__main__.RateLimitError'>": 29, "<class 'asyncio.exceptions.TimeoutError'>": 1}
{"total": 300, "avg_time_per_sample": "0:00:13.234775", "success": 245, "fail": 55, "<class '__main__.ContentFormatError'>": 3, "<class '__main__.RateLimitError'>": 49, "<class 'asyncio.exceptions.TimeoutError'>": 2, "<class 'KeyError'>": 1}
{"total": 400, "avg_time_per_sample": "0:00:12.980151", "success": 333, "fail": 67, "<class '__main__.ContentFormatError'>": 5, "<class '__main__.RateLimitError'>": 59, "<class 'asyncio.exceptions.TimeoutError'>": 2, "<class 'KeyError'>": 1}
{"total": 500, "avg_time_per_sample": "0:00:13.406214", "success": 413, "fail": 87, "<class '__main__.ContentFormatError'>": 7, "<class '__main__.RateLimitError'>": 77, "<class 'asyncio.exceptions.TimeoutError'>": 2, "<class 'KeyError'>": 1}
{"total": 600, "avg_time_per_sample": "0:00:13.788642", "success": 487, "fail": 113, "<class '__main__.ContentFormatError'>": 7, "<class '__main__.RateLimitError'>": 100, "<class 'asyncio.exceptions.TimeoutError'>": 5, "<class 'KeyError'>": 1}
{"total": 700, "avg_time_per_sample": "0:00:14.085124", "success": 564, "fail": 136, "<class '__main__.ContentFormatError'>": 7, "<class '__main__.RateLimitError'>": 121, "<class 'asyncio.exceptions.TimeoutError'>": 7, "<class 'KeyError'>": 1}
{"total": 800, "avg_time_per_sample": "0:00:14.321462", "success": 641, "fail": 159, "<class '__main__.ContentFormatError'>": 8, "<class '__main__.RateLimitError'>": 141, "<class 'asyncio.exceptions.TimeoutError'>": 9, "<class 'KeyError'>": 1}
{"total": 900, "avg_time_per_sample": "0:00:14.659003", "success": 713, "fail": 187, "<class '__main__.ContentFormatError'>": 8, "<class '__main__.RateLimitError'>": 168, "<class 'asyncio.exceptions.TimeoutError'>": 9, "<class 'KeyError'>": 2}
{"total": 1000, "avg_time_per_sample": "0:00:15.153823", "success": 775, "fail": 225, "<class '__main__.ContentFormatError'>": 9, "<class '__main__.RateLimitError'>": 203, "<class 'asyncio.exceptions.TimeoutError'>": 10, "<class 'KeyError'>": 3}
{"total": 1100, "avg_time_per_sample": "0:00:15.290999", "success": 844, "fail": 256, "<class '__main__.ContentFormatError'>": 9, "<class '__main__.RateLimitError'>": 234, "<class 'asyncio.exceptions.TimeoutError'>": 10, "<class 'KeyError'>": 3}
{"total": 1200, "avg_time_per_sample": "0:00:15.558860", "success": 910, "fail": 290, "<class '__main__.ContentFormatError'>": 10, "<class '__main__.RateLimitError'>": 267, "<class 'asyncio.exceptions.TimeoutError'>": 10, "<class 'KeyError'>": 3}
{"total": 1300, "avg_time_per_sample": "0:00:15.603290", "success": 988, "fail": 312, "<class '__main__.ContentFormatError'>": 11, "<class '__main__.RateLimitError'>": 285, "<class 'asyncio.exceptions.TimeoutError'>": 13, "<class 'KeyError'>": 3}
{"total": 1400, "avg_time_per_sample": "0:00:15.548603", "success": 1066, "fail": 334, "<class '__main__.ContentFormatError'>": 12, "<class '__main__.RateLimitError'>": 306, "<class 'asyncio.exceptions.TimeoutError'>": 13, "<class 'KeyError'>": 3}
{"total": 1500, "avg_time_per_sample": "0:00:15.594365", "success": 1139, "fail": 361, "<class '__main__.ContentFormatError'>": 16, "<class '__main__.RateLimitError'>": 328, "<class 'asyncio.exceptions.TimeoutError'>": 13, "<class 'KeyError'>": 4}
{"total": 1600, "avg_time_per_sample": "0:00:15.563565", "success": 1221, "fail": 379, "<class '__main__.ContentFormatError'>": 17, "<class '__main__.RateLimitError'>": 344, "<class 'asyncio.exceptions.TimeoutError'>": 14, "<class 'KeyError'>": 4}
{"total": 1700, "avg_time_per_sample": "0:00:15.552764", "success": 1300, "fail": 400, "<class '__main__.ContentFormatError'>": 18, "<class '__main__.RateLimitError'>": 363, "<class 'asyncio.exceptions.TimeoutError'>": 15, "<class 'KeyError'>": 4}
{"total": 1800, "avg_time_per_sample": "0:00:15.551450", "success": 1376, "fail": 424, "<class '__main__.ContentFormatError'>": 21, "<class '__main__.RateLimitError'>": 384, "<class 'asyncio.exceptions.TimeoutError'>": 15, "<class 'KeyError'>": 4}
{"total": 1900, "avg_time_per_sample": "0:00:15.495613", "success": 1453, "fail": 447, "<class '__main__.ContentFormatError'>": 21, "<class '__main__.RateLimitError'>": 407, "<class 'asyncio.exceptions.TimeoutError'>": 15, "<class 'KeyError'>": 4}
{"total": 2000, "avg_time_per_sample": "0:00:15.496281", "success": 1526, "fail": 474, "<class '__main__.ContentFormatError'>": 22, "<class '__main__.RateLimitError'>": 432, "<class 'asyncio.exceptions.TimeoutError'>": 15, "<class 'KeyError'>": 5}
{"total": 2100, "avg_time_per_sample": "0:00:15.421484", "success": 1605, "fail": 495, "<class '__main__.ContentFormatError'>": 24, "<class '__main__.RateLimitError'>": 450, "<class 'asyncio.exceptions.TimeoutError'>": 16, "<class 'KeyError'>": 5}
{"total": 2200, "avg_time_per_sample": "0:00:15.353331", "success": 1681, "fail": 519, "<class '__main__.ContentFormatError'>": 24, "<class '__main__.RateLimitError'>": 474, "<class 'asyncio.exceptions.TimeoutError'>": 16, "<class 'KeyError'>": 5}
{"total": 2300, "avg_time_per_sample": "0:00:15.352390", "success": 1759, "fail": 541, "<class '__main__.ContentFormatError'>": 25, "<class '__main__.RateLimitError'>": 494, "<class 'asyncio.exceptions.TimeoutError'>": 17, "<class 'KeyError'>": 5}
{"total": 2400, "avg_time_per_sample": "0:00:15.305033", "success": 1835, "fail": 565, "<class '__main__.ContentFormatError'>": 26, "<class '__main__.RateLimitError'>": 515, "<class 'asyncio.exceptions.TimeoutError'>": 19, "<class 'KeyError'>": 5}
{"total": 2500, "avg_time_per_sample": "0:00:15.274257", "success": 1915, "fail": 585, "<class '__main__.ContentFormatError'>": 27, "<class '__main__.RateLimitError'>": 533, "<class 'asyncio.exceptions.TimeoutError'>": 20, "<class 'KeyError'>": 5}
{"total": 2600, "avg_time_per_sample": "0:00:15.400848", "success": 1979, "fail": 621, "<class '__main__.ContentFormatError'>": 30, "<class '__main__.RateLimitError'>": 566, "<class 'asyncio.exceptions.TimeoutError'>": 20, "<class 'KeyError'>": 5}
{"total": 2700, "avg_time_per_sample": "0:00:15.557061", "success": 2037, "fail": 663, "<class '__main__.ContentFormatError'>": 31, "<class '__main__.RateLimitError'>": 607, "<class 'asyncio.exceptions.TimeoutError'>": 20, "<class 'KeyError'>": 5}
{"total": 2800, "avg_time_per_sample": "0:00:15.545819", "success": 2115, "fail": 685, "<class '__main__.ContentFormatError'>": 33, "<class '__main__.RateLimitError'>": 627, "<class 'asyncio.exceptions.TimeoutError'>": 20, "<class 'KeyError'>": 5}
{"total": 2900, "avg_time_per_sample": "0:00:15.568062", "success": 2191, "fail": 709, "<class '__main__.ContentFormatError'>": 34, "<class '__main__.RateLimitError'>": 648, "<class 'asyncio.exceptions.TimeoutError'>": 22, "<class 'KeyError'>": 5}
{"total": 3000, "avg_time_per_sample": "0:00:15.759779", "success": 2245, "fail": 755, "<class '__main__.ContentFormatError'>": 34, "<class '__main__.RateLimitError'>": 692, "<class 'asyncio.exceptions.TimeoutError'>": 24, "<class 'KeyError'>": 5}
{"total": 3100, "avg_time_per_sample": "0:00:16.019353", "success": 2288, "fail": 812, "<class '__main__.ContentFormatError'>": 35, "<class '__main__.RateLimitError'>": 746, "<class 'asyncio.exceptions.TimeoutError'>": 26, "<class 'KeyError'>": 5}
{"total": 3200, "avg_time_per_sample": "0:00:16.316532", "success": 2328, "fail": 872, "<class '__main__.ContentFormatError'>": 37, "<class '__main__.RateLimitError'>": 800, "<class 'asyncio.exceptions.TimeoutError'>": 29, "<class 'KeyError'>": 5, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 1}
{"total": 3300, "avg_time_per_sample": "0:00:16.640744", "success": 2364, "fail": 936, "<class '__main__.ContentFormatError'>": 39, "<class '__main__.RateLimitError'>": 862, "<class 'asyncio.exceptions.TimeoutError'>": 29, "<class 'KeyError'>": 5, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 1}
{"total": 3400, "avg_time_per_sample": "0:00:16.913796", "success": 2403, "fail": 997, "<class '__main__.ContentFormatError'>": 41, "<class '__main__.RateLimitError'>": 920, "<class 'asyncio.exceptions.TimeoutError'>": 30, "<class 'KeyError'>": 5, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 1}
{"total": 3500, "avg_time_per_sample": "0:00:17.224395", "success": 2430, "fail": 1070, "<class '__main__.ContentFormatError'>": 42, "<class '__main__.RateLimitError'>": 991, "<class 'asyncio.exceptions.TimeoutError'>": 31, "<class 'KeyError'>": 5, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 1}
{"total": 3600, "avg_time_per_sample": "0:00:17.500923", "success": 2467, "fail": 1133, "<class '__main__.ContentFormatError'>": 42, "<class '__main__.RateLimitError'>": 1054, "<class 'asyncio.exceptions.TimeoutError'>": 31, "<class 'KeyError'>": 5, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 1}
{"total": 3700, "avg_time_per_sample": "0:00:17.757566", "success": 2504, "fail": 1196, "<class '__main__.ContentFormatError'>": 42, "<class '__main__.RateLimitError'>": 1116, "<class 'asyncio.exceptions.TimeoutError'>": 31, "<class 'KeyError'>": 6, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 1}
{"total": 3800, "avg_time_per_sample": "0:00:17.993460", "success": 2542, "fail": 1258, "<class '__main__.ContentFormatError'>": 43, "<class '__main__.RateLimitError'>": 1177, "<class 'asyncio.exceptions.TimeoutError'>": 31, "<class 'KeyError'>": 6, "<class 'aiohttp.client_exceptions.ContentTypeError'>": 1}
