{"accuracy": 0.92, "correct_count": 184, "total_count": 200}
{"id": "parallel_9", "model_name": "D-CORE-14B", "test_category": "parallel", "valid": false, "error": ["Wrong number of functions."], "error_type": "parallel_function_checker_no_order:wrong_count", "prompt": {"id": "parallel_9", "question": [[{"role": "user", "content": "Find two movie theatres near San Diego with availability for Tenet at 5 pm and No Time To Die at 7:30 pm."}]], "function": [{"name": "find_movie_showing", "description": "Find local movie theatres and their schedule for a specific movie", "parameters": {"type": "dict", "properties": {"location": {"type": "string", "description": "The city and state, e.g. San Diego, CA"}, "movie": {"type": "array", "items": {"type": "string", "enum": ["Tenet", "No Time To Die"]}, "description": "Preferred movie to watch."}, "time": {"type": "array", "items": {"type": "string", "description": "Show time for each movie"}}}, "required": ["location", "movie", "time"]}}]}, "model_result_raw": "\n[find_movie_showing(location=\"San Diego, CA\", movie=[\"Tenet\", \"No Time To Die\"], time=[\"5:00 PM\", \"7:30 PM\"])]", "model_result_decoded": [{"find_movie_showing": {"location": "San Diego, CA", "movie": ["Tenet", "No Time To Die"], "time": ["5:00 PM", "7:30 PM"]}}], "possible_answer": [{"find_movie_showing": {"location": ["San Diego", "San Diego, CA", "CA"], "movie": [["Tenet"]], "time": [["5 pm"], ["17:00"]]}}, {"find_movie_showing": {"location": ["San Diego", "San Diego, CA", "CA"], "movie": [["No Time To Die"]], "time": [["7:30 pm"], ["19:30"]]}}]}
{"id": "parallel_19", "model_name": "D-CORE-14B", "test_category": "parallel", "valid": false, "error": ["Could not find a matching function among index [0, 1, 2] of model output for index 0 of possible answers.", {"Model Result Index 0": {"sub_error": ["Invalid value for parameter 'interest_rate': 4.0. Expected one of [0.04]."], "sub_error_type": "value_error:others", "model_output_item": {"calculate_mortgage_payment": {"loan_amount": 400000, "interest_rate": 4.0, "loan_term": 15}}, "possible_answer_item": {"calculate_mortgage_payment": {"loan_amount": [400000], "interest_rate": [0.04], "loan_term": [15]}}}}, {"Model Result Index 1": {"sub_error": ["Invalid value for parameter 'interest_rate': 4.0. Expected one of [0.04]."], "sub_error_type": "value_error:others", "model_output_item": {"calculate_mortgage_payment": {"loan_amount": 400000, "interest_rate": 4.0, "loan_term": 20}}, "possible_answer_item": {"calculate_mortgage_payment": {"loan_amount": [400000], "interest_rate": [0.04], "loan_term": [15]}}}}, {"Model Result Index 2": {"sub_error": ["Invalid value for parameter 'interest_rate': 4.0. Expected one of [0.04]."], "sub_error_type": "value_error:others", "model_output_item": {"calculate_mortgage_payment": {"loan_amount": 400000, "interest_rate": 4.0, "loan_term": 30}}, "possible_answer_item": {"calculate_mortgage_payment": {"loan_amount": [400000], "interest_rate": [0.04], "loan_term": [15]}}}}], "error_type": "parallel_function_checker_no_order:cannot_find_match", "prompt": {"id": "parallel_19", "question": [[{"role": "user", "content": "Calculate the monthly mortgage payment for a loan amount of $400,000, with an annual interest rate of 4% and a loan term of 15, 20 and 30 years."}]], "function": [{"name": "calculate_mortgage_payment", "description": "Calculate the monthly mortgage payment for a given loan amount, interest rate, and loan term.", "parameters": {"type": "dict", "properties": {"loan_amount": {"type": "integer", "description": "The loan amount."}, "interest_rate": {"type": "float", "description": "The annual interest rate."}, "loan_term": {"type": "integer", "description": "The loan term in years."}}, "required": ["loan_amount", "interest_rate", "loan_term"]}}]}, "model_result_raw": "\n[calculate_mortgage_payment(loan_amount=400000, interest_rate=4.0, loan_term=15), calculate_mortgage_payment(loan_amount=400000, interest_rate=4.0, loan_term=20), calculate_mortgage_payment(loan_amount=400000, interest_rate=4.0, loan_term=30)]", "model_result_decoded": [{"calculate_mortgage_payment": {"loan_amount": 400000, "interest_rate": 4.0, "loan_term": 15}}, {"calculate_mortgage_payment": {"loan_amount": 400000, "interest_rate": 4.0, "loan_term": 20}}, {"calculate_mortgage_payment": {"loan_amount": 400000, "interest_rate": 4.0, "loan_term": 30}}], "possible_answer": [{"calculate_mortgage_payment": {"loan_amount": [400000], "interest_rate": [0.04], "loan_term": [15]}}, {"calculate_mortgage_payment": {"loan_amount": [400000], "interest_rate": [0.04], "loan_term": [20]}}, {"calculate_mortgage_payment": {"loan_amount": [400000], "interest_rate": [0.04], "loan_term": [30]}}]}
{"id": "parallel_22", "model_name": "D-CORE-14B", "test_category": "parallel", "valid": false, "error": ["Could not find a matching function among index [0, 1, 2, 3] of model output for index 0 of possible answers.", {"Model Result Index 0": {"sub_error": ["Invalid value for parameter 'court': 'Los Angeles County'. Expected one of ['Los Angeles County Court', 'Los Angeles', 'Los Angeles, CA', 'LA']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"court_info.get_case_status": {"case_number": "XY1234", "court": "Los Angeles County", "details": "status"}}, "possible_answer_item": {"court_info.get_case_status": {"case_number": ["XY1234"], "court": ["Los Angeles County Court", "Los Angeles", "Los Angeles, CA", "LA"], "details": ["status", ""]}}}}, {"Model Result Index 1": {"sub_error": ["Invalid value for parameter 'court': 'Los Angeles County'. Expected one of ['Los Angeles County Court', 'Los Angeles', 'Los Angeles, CA', 'LA']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"court_info.get_case_status": {"case_number": "XY1234", "court": "Los Angeles County", "details": "trial_date"}}, "possible_answer_item": {"court_info.get_case_status": {"case_number": ["XY1234"], "court": ["Los Angeles County Court", "Los Angeles", "Los Angeles, CA", "LA"], "details": ["status", ""]}}}}, {"Model Result Index 2": {"sub_error": ["Invalid value for parameter 'case_number': 'GH5678'. Expected one of ['XY1234']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"court_info.get_case_status": {"case_number": "GH5678", "court": "Orange County", "details": "status"}}, "possible_answer_item": {"court_info.get_case_status": {"case_number": ["XY1234"], "court": ["Los Angeles County Court", "Los Angeles", "Los Angeles, CA", "LA"], "details": ["status", ""]}}}}, {"Model Result Index 3": {"sub_error": ["Invalid value for parameter 'case_number': 'GH5678'. Expected one of ['XY1234']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"court_info.get_case_status": {"case_number": "GH5678", "court": "Orange County", "details": "trial_date"}}, "possible_answer_item": {"court_info.get_case_status": {"case_number": ["XY1234"], "court": ["Los Angeles County Court", "Los Angeles", "Los Angeles, CA", "LA"], "details": ["status", ""]}}}}], "error_type": "parallel_function_checker_no_order:cannot_find_match", "prompt": {"id": "parallel_22", "question": [[{"role": "user", "content": "What is the status and scheduled trial date for case number XY1234 in Los Angeles County Court, and case number GH5678 in Orange County Court?"}]], "function": [{"name": "court_info.get_case_status", "description": "Retrieves the status and trial dates for court cases from specified county courts.", "parameters": {"type": "dict", "properties": {"case_number": {"type": "string", "description": "The specific court case number."}, "court": {"type": "string", "description": "The county court where the case is filed."}, "details": {"type": "string", "enum": ["status", "trial_date"], "description": "Specific details required about the court case. Defaults to 'status'."}}, "required": ["case_number", "court"]}}]}, "model_result_raw": "\n[court_info.get_case_status(case_number=\"XY1234\", court=\"Los Angeles County\", details=\"status\"), court_info.get_case_status(case_number=\"XY1234\", court=\"Los Angeles County\", details=\"trial_date\"), court_info.get_case_status(case_number=\"GH5678\", court=\"Orange County\", details=\"status\"), court_info.get_case_status(case_number=\"GH5678\", court=\"Orange County\", details=\"trial_date\")]", "model_result_decoded": [{"court_info.get_case_status": {"case_number": "XY1234", "court": "Los Angeles County", "details": "status"}}, {"court_info.get_case_status": {"case_number": "XY1234", "court": "Los Angeles County", "details": "trial_date"}}, {"court_info.get_case_status": {"case_number": "GH5678", "court": "Orange County", "details": "status"}}, {"court_info.get_case_status": {"case_number": "GH5678", "court": "Orange County", "details": "trial_date"}}], "possible_answer": [{"court_info.get_case_status": {"case_number": ["XY1234"], "court": ["Los Angeles County Court", "Los Angeles", "Los Angeles, CA", "LA"], "details": ["status", ""]}}, {"court_info.get_case_status": {"case_number": ["GH5678"], "court": ["Orange County Court", "Orange County", "OC"], "details": ["status", ""]}}, {"court_info.get_case_status": {"case_number": ["XY1234"], "court": ["Los Angeles County Court", "Los Angeles", "Los Angeles, CA", "LA"], "details": ["trial_date"]}}, {"court_info.get_case_status": {"case_number": ["GH5678"], "court": ["Orange County Court", "Orange County", "OC"], "details": ["trial_date"]}}]}
{"id": "parallel_26", "model_name": "D-CORE-14B", "test_category": "parallel", "valid": false, "error": ["Wrong number of functions."], "error_type": "parallel_function_checker_no_order:wrong_count", "prompt": {"id": "parallel_26", "question": [[{"role": "user", "content": "Find details of lawsuits with case numbers '67813', '71249' filed in the New York District court for type 'Civil' and 'Criminal' cases."}]], "function": [{"name": "court_case.find", "description": "Locate details of court cases based on specific parameters like case number and case type.", "parameters": {"type": "dict", "properties": {"location": {"type": "string", "description": "The city and court where the lawsuit is filed."}, "case_number": {"type": "array", "items": {"type": "string"}, "description": "The unique case numbers of the lawsuits."}, "case_type": {"type": "string", "enum": ["Civil", "Criminal"], "description": "Type of the court case.", "default": "Civil"}}, "required": ["location", "case_number"]}}]}, "model_result_raw": "\n[court_case.find(location=\"New York District\", case_number=[\"67813\", \"71249\"], case_type=\"Civil\"), court_case.find(location=\"New York District\", case_number=[\"67813\", \"71249\"], case_type=\"Criminal\")]", "model_result_decoded": [{"court_case.find": {"location": "New York District", "case_number": ["67813", "71249"], "case_type": "Civil"}}, {"court_case.find": {"location": "New York District", "case_number": ["67813", "71249"], "case_type": "Criminal"}}], "possible_answer": [{"court_case.find": {"location": ["New York District", "NY District", "New York", "New York, NY", "NY"], "case_number": [["67813"]], "case_type": ["Civil", ""]}}, {"court_case.find": {"location": ["New York District", "NY District", "New York", "New York, NY", "NY"], "case_number": [["71249"]], "case_type": ["Criminal"]}}, {"court_case.find": {"location": ["New York District", "NY District", "New York", "New York, NY", "NY"], "case_number": [["67813"]], "case_type": ["Criminal"]}}, {"court_case.find": {"location": ["New York District", "NY District", "New York", "New York, NY", "NY"], "case_number": [["71249"]], "case_type": ["Civil", ""]}}]}
{"id": "parallel_27", "model_name": "D-CORE-14B", "test_category": "parallel", "valid": false, "error": ["Could not find a matching function among index [0, 1] of model output for index 0 of possible answers.", {"Model Result Index 0": {"sub_error": ["Invalid value for parameter 'location': 'Berkeley, CA'. Expected one of ['Berkeley', 'Berkeley,California', 'CA']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"nature_reserve.find_nearby": {"location": "Berkeley, CA", "amenities": ["Picnic Tables", "Public Restrooms"], "proximity": 10}}, "possible_answer_item": {"nature_reserve.find_nearby": {"location": ["Berkeley", "Berkeley,California", "CA"], "amenities": [["Picnic Tables", "Public Restrooms"], ["Public Restrooms", "Picnic Tables"]], "proximity": [10]}}}}, {"Model Result Index 1": {"sub_error": ["Invalid value for parameter 'location': 'Tokyo'. Expected one of ['Berkeley', 'Berkeley,California', 'CA']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"nature_reserve.find_nearby": {"location": "Tokyo", "amenities": ["Playgrounds", "Biking Trails"], "proximity": 5}}, "possible_answer_item": {"nature_reserve.find_nearby": {"location": ["Berkeley", "Berkeley,California", "CA"], "amenities": [["Picnic Tables", "Public Restrooms"], ["Public Restrooms", "Picnic Tables"]], "proximity": [10]}}}}], "error_type": "parallel_function_checker_no_order:cannot_find_match", "prompt": {"id": "parallel_27", "question": [[{"role": "user", "content": "Find a nature reserve around Berkeley within 10 kilometers that has picnic tables and public restrooms, as well as one around Tokyo within 5 kilometers that has playgrounds and biking trails."}]], "function": [{"name": "nature_reserve.find_nearby", "description": "Locate nearby nature reserves based on specific criteria such as amenities and proximity.", "parameters": {"type": "dict", "properties": {"location": {"type": "string", "description": "The city where you want to locate a nature reserve."}, "amenities": {"type": "array", "items": {"type": "string", "enum": ["Picnic Tables", "Public Restrooms", "Playgrounds", "Biking Trails", "Hiking Trails", "Camping Grounds"]}, "description": "Preferred amenities in the nature reserve."}, "proximity": {"type": "integer", "description": "The radius within which to look for nature reserves in kilometers."}}, "required": ["location", "proximity", "amenities"]}}]}, "model_result_raw": "\n[nature_reserve.find_nearby(location=\"Berkeley, CA\", amenities=[\"Picnic Tables\", \"Public Restrooms\"], proximity=10), nature_reserve.find_nearby(location=\"Tokyo\", amenities=[\"Playgrounds\", \"Biking Trails\"], proximity=5)]", "model_result_decoded": [{"nature_reserve.find_nearby": {"location": "Berkeley, CA", "amenities": ["Picnic Tables", "Public Restrooms"], "proximity": 10}}, {"nature_reserve.find_nearby": {"location": "Tokyo", "amenities": ["Playgrounds", "Biking Trails"], "proximity": 5}}], "possible_answer": [{"nature_reserve.find_nearby": {"location": ["Berkeley", "Berkeley,California", "CA"], "amenities": [["Picnic Tables", "Public Restrooms"], ["Public Restrooms", "Picnic Tables"]], "proximity": [10]}}, {"nature_reserve.find_nearby": {"location": ["Tokyo"], "amenities": [["Playgrounds", "Biking Trails"], ["Biking Trails", "Playgrounds"]], "proximity": [5]}}]}
{"id": "parallel_29", "model_name": "D-CORE-14B", "test_category": "parallel", "valid": false, "error": ["Could not find a matching function among index [1] of model output for index 1 of possible answers.", {"Model Result Index 1": {"sub_error": ["Invalid value for parameter 'adults': 1. Expected one of [0]."], "sub_error_type": "value_error:dict_value", "model_output_item": {"waste_calculation.calculate": {"population": {"adults": 1, "children": 0, "singles": 1}, "location": "New York"}}, "possible_answer_item": {"waste_calculation.calculate": {"population": [{"adults": [0], "children": [0], "singles": [1]}], "location": ["New York", "New York, NY", "NY", "New York City", "NYC"]}}}}], "error_type": "parallel_function_checker_no_order:cannot_find_match", "prompt": {"id": "parallel_29", "question": [[{"role": "user", "content": "Find out how much waste a family of four generates in Los Angeles, assuming two children and two adults. Also, calculate waste production for a bachelor in New York."}]], "function": [{"name": "waste_calculation.calculate", "description": "Calculates the estimated waste generated by different population sizes in a specific location.", "parameters": {"type": "dict", "properties": {"population": {"type": "dict", "description": "The description of population. 'adults' is the number of adults in the household. 'children' is the number of children. 'singles' is the number of single adults living alone.", "required": ["adults", "children", "singles"]}, "location": {"type": "string", "description": "The city where the population resides."}}, "required": ["population", "location"]}}]}, "model_result_raw": "\n[waste_calculation.calculate(population={\"adults\": 2, \"children\": 2, \"singles\": 0}, location=\"Los Angeles\"), waste_calculation.calculate(population={\"adults\": 1, \"children\": 0, \"singles\": 1}, location=\"New York\")]", "model_result_decoded": [{"waste_calculation.calculate": {"population": {"adults": 2, "children": 2, "singles": 0}, "location": "Los Angeles"}}, {"waste_calculation.calculate": {"population": {"adults": 1, "children": 0, "singles": 1}, "location": "New York"}}], "possible_answer": [{"waste_calculation.calculate": {"population": [{"adults": [2], "children": [2], "singles": [0]}], "location": ["Los Angeles", "Los Angeles, CA", "LA"]}}, {"waste_calculation.calculate": {"population": [{"adults": [0], "children": [0], "singles": [1]}], "location": ["New York", "New York, NY", "NY", "New York City", "NYC"]}}]}
{"id": "parallel_38", "model_name": "D-CORE-14B", "test_category": "parallel", "valid": false, "error": ["Could not find a matching function among index [0, 1] of model output for index 0 of possible answers.", {"Model Result Index 0": {"sub_error": ["Optional parameter 'shortest_route' not provided and not marked as optional."], "sub_error_type": "simple_function_checker:missing_optional", "model_output_item": {"calc_distance": {"start_loc": "New York", "end_loc": "Washington DC"}}, "possible_answer_item": {"calc_distance": {"start_loc": ["New York", "New York, NY", "New York City", "NYC"], "end_loc": ["Washington DC", "Washington D.C."], "shortest_route": [true]}}}}, {"Model Result Index 1": {"sub_error": ["Invalid value for parameter 'start_loc': 'Los Angeles'. Expected one of ['New York', 'New York, NY', 'New York City', 'NYC']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"calc_distance": {"start_loc": "Los Angeles", "end_loc": "San Francisco", "shortest_route": true}}, "possible_answer_item": {"calc_distance": {"start_loc": ["New York", "New York, NY", "New York City", "NYC"], "end_loc": ["Washington DC", "Washington D.C."], "shortest_route": [true]}}}}], "error_type": "parallel_function_checker_no_order:cannot_find_match", "prompt": {"id": "parallel_38", "question": [[{"role": "user", "content": "What's the driving distance between New York and Washington DC, and between Los Angeles and San Francisco with optional parameter shortest route enabled?"}]], "function": [{"name": "calc_distance", "description": "Calculate the driving distance between two locations.", "parameters": {"type": "dict", "properties": {"start_loc": {"type": "string", "description": "Starting location."}, "end_loc": {"type": "string", "description": "Ending location."}, "shortest_route": {"type": "boolean", "default": "false", "description": "If true, returns the shortest driving route."}}, "required": ["start_loc", "end_loc"]}}]}, "model_result_raw": "\n[calc_distance(start_loc=\"New York\", end_loc=\"Washington DC\"), calc_distance(start_loc=\"Los Angeles\", end_loc=\"San Francisco\", shortest_route=True)]", "model_result_decoded": [{"calc_distance": {"start_loc": "New York", "end_loc": "Washington DC"}}, {"calc_distance": {"start_loc": "Los Angeles", "end_loc": "San Francisco", "shortest_route": true}}], "possible_answer": [{"calc_distance": {"start_loc": ["New York", "New York, NY", "New York City", "NYC"], "end_loc": ["Washington DC", "Washington D.C."], "shortest_route": [true]}}, {"calc_distance": {"start_loc": ["Los Angeles", "Los Angeles, CA", "LA"], "end_loc": ["San Francisco", "SF"], "shortest_route": [true]}}]}
{"id": "parallel_41", "model_name": "D-CORE-14B", "test_category": "parallel", "valid": false, "error": ["Could not find a matching function among index [0, 1] of model output for index 0 of possible answers.", {"Model Result Index 0": {"sub_error": ["Invalid value for parameter 'instruments': ['Yamaha acoustic guitars', 'Kawai pianos']. Expected one of [['Yamaha Acoustic Guitar', 'Kawai Piano'], ['Kawai Piano', 'Yamaha Acoustic Guitar'], ['Yamaha acoustic guitar', 'Kawai piano'], ['Kawai piano', 'Yamaha acoustic guitar']]."], "sub_error_type": "value_error:list/tuple", "model_output_item": {"find_music_instrument_store": {"location": "San Francisco, CA", "instruments": ["Yamaha acoustic guitars", "Kawai pianos"]}}, "possible_answer_item": {"find_music_instrument_store": {"location": ["San Francisco, CA", "San Francisco, CA", "San Francisco, California"], "instruments": [["Yamaha Acoustic Guitar", "Kawai Piano"], ["Kawai Piano", "Yamaha Acoustic Guitar"], ["Yamaha acoustic guitar", "Kawai piano"], ["Kawai piano", "Yamaha acoustic guitar"]]}}}}, {"Model Result Index 1": {"sub_error": ["Invalid value for parameter 'location': 'Chicago, IL'. Expected one of ['San Francisco, CA', 'San Francisco, CA', 'San Francisco, California']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"find_music_instrument_store": {"location": "Chicago, IL", "instruments": ["Yamaha acoustic guitars", "Kawai pianos"]}}, "possible_answer_item": {"find_music_instrument_store": {"location": ["San Francisco, CA", "San Francisco, CA", "San Francisco, California"], "instruments": [["Yamaha Acoustic Guitar", "Kawai Piano"], ["Kawai Piano", "Yamaha Acoustic Guitar"], ["Yamaha acoustic guitar", "Kawai piano"], ["Kawai piano", "Yamaha acoustic guitar"]]}}}}], "error_type": "parallel_function_checker_no_order:cannot_find_match", "prompt": {"id": "parallel_41", "question": [[{"role": "user", "content": "Show me the closest music shop where I can purchase a Yamaha acoustic guitar and a Kawai piano in San Francisco, California, and Chicago, Illinois."}]], "function": [{"name": "find_music_instrument_store", "description": "Locate nearby music instrument stores that sell specific brands or instruments", "parameters": {"type": "dict", "properties": {"location": {"type": "string", "description": "The city and state e.g. San Francisco, CA."}, "instruments": {"type": "array", "items": {"type": "string"}, "description": "A list of specific instruments or brands you are looking for."}}, "required": ["location", "instruments"]}}]}, "model_result_raw": "\n[find_music_instrument_store(location=\"San Francisco, CA\", instruments=[\"Yamaha acoustic guitars\", \"Kawai pianos\"]), find_music_instrument_store(location=\"Chicago, IL\", instruments=[\"Yamaha acoustic guitars\", \"Kawai pianos\"])]", "model_result_decoded": [{"find_music_instrument_store": {"location": "San Francisco, CA", "instruments": ["Yamaha acoustic guitars", "Kawai pianos"]}}, {"find_music_instrument_store": {"location": "Chicago, IL", "instruments": ["Yamaha acoustic guitars", "Kawai pianos"]}}], "possible_answer": [{"find_music_instrument_store": {"location": ["San Francisco, CA", "San Francisco, CA", "San Francisco, California"], "instruments": [["Yamaha Acoustic Guitar", "Kawai Piano"], ["Kawai Piano", "Yamaha Acoustic Guitar"], ["Yamaha acoustic guitar", "Kawai piano"], ["Kawai piano", "Yamaha acoustic guitar"]]}}, {"find_music_instrument_store": {"location": ["Chicago, IL", "Chicago, Illinois", "Chicago, IL."], "instruments": [["Yamaha Acoustic Guitar", "Kawai Piano"], ["Kawai Piano", "Yamaha Acoustic Guitar"], ["Yamaha acoustic guitar", "Kawai piano"], ["Kawai piano", "Yamaha acoustic guitar"]]}}]}
{"id": "parallel_44", "model_name": "D-CORE-14B", "test_category": "parallel", "valid": false, "error": ["Could not find a matching function among index [0, 1] of model output for index 0 of possible answers.", {"Model Result Index 0": {"sub_error": ["Invalid value for parameter 'date': '2023-10-13'. Expected one of ['next Friday']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"concert.find_nearby": {"location": "Berlin", "date": "2023-10-13", "genre": "classical", "amenities": ["Parking"]}}, "possible_answer_item": {"concert.find_nearby": {"location": ["Berlin"], "date": ["next Friday"], "genre": ["Classical", "classical"], "amenities": [["Parking"], ""]}}}}, {"Model Result Index 1": {"sub_error": ["Invalid value for parameter 'location': 'Paris'. Expected one of ['Berlin']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"concert.find_nearby": {"location": "Paris", "date": "2023-10-13", "genre": "classical", "amenities": ["Parking"]}}, "possible_answer_item": {"concert.find_nearby": {"location": ["Berlin"], "date": ["next Friday"], "genre": ["Classical", "classical"], "amenities": [["Parking"], ""]}}}}], "error_type": "parallel_function_checker_no_order:cannot_find_match", "prompt": {"id": "parallel_44", "question": [[{"role": "user", "content": "Find me all the classical concerts near Berlin and Paris happening next Friday, and I am interested only in those with available parking."}]], "function": [{"name": "concert.find_nearby", "description": "Locate nearby concerts based on specific criteria like genre and availability of parking.", "parameters": {"type": "dict", "properties": {"location": {"type": "string", "description": "The city where the user wants to find a concert."}, "date": {"type": "string", "description": "The date on which the user wants to attend a concert."}, "genre": {"type": "string", "description": "The genre of music of the concert."}, "amenities": {"type": "array", "items": {"type": "string", "enum": ["Parking", "Food and Beverages", "VIP Seating", "Disability Access"]}, "description": "Amenities preferred at the concert.", "default": ["Parking"]}}, "required": ["location", "date", "genre"]}}]}, "model_result_raw": "\n[concert.find_nearby(location='Berlin', date='2023-10-13', genre='classical', amenities=['Parking']), concert.find_nearby(location='Paris', date='2023-10-13', genre='classical', amenities=['Parking'])]", "model_result_decoded": [{"concert.find_nearby": {"location": "Berlin", "date": "2023-10-13", "genre": "classical", "amenities": ["Parking"]}}, {"concert.find_nearby": {"location": "Paris", "date": "2023-10-13", "genre": "classical", "amenities": ["Parking"]}}], "possible_answer": [{"concert.find_nearby": {"location": ["Berlin"], "date": ["next Friday"], "genre": ["Classical", "classical"], "amenities": [["Parking"], ""]}}, {"concert.find_nearby": {"location": ["Paris"], "date": ["next Friday"], "genre": ["Classical", "classical"], "amenities": [["Parking"], ""]}}]}
{"id": "parallel_89", "model_name": "D-CORE-14B", "test_category": "parallel", "valid": false, "error": ["Could not find a matching function among index [0, 1, 2] of model output for index 0 of possible answers.", {"Model Result Index 0": {"sub_error": ["Invalid value for parameter 'start_location': 'San Francisco home'. Expected one of ['San Francisco', 'SF']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"get_directions": {"start_location": "San Francisco home", "end_location": "Palo Alto office", "route_type": "fastest"}}, "possible_answer_item": {"get_directions": {"start_location": ["San Francisco", "SF"], "end_location": ["Palo Alto"], "route_type": ["fastest"]}}}}, {"Model Result Index 1": {"sub_error": ["Invalid value for parameter 'start_location': 'Palo Alto office'. Expected one of ['San Francisco', 'SF']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"get_directions": {"start_location": "Palo Alto office", "end_location": "Golden Gate Bridge, San Francisco", "route_type": "scenic"}}, "possible_answer_item": {"get_directions": {"start_location": ["San Francisco", "SF"], "end_location": ["Palo Alto"], "route_type": ["fastest"]}}}}, {"Model Result Index 2": {"sub_error": ["Invalid value for parameter 'start_location': 'Golden Gate Bridge'. Expected one of ['San Francisco', 'SF']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"get_directions": {"start_location": "Golden Gate Bridge", "end_location": "San Francisco home", "route_type": "fastest"}}, "possible_answer_item": {"get_directions": {"start_location": ["San Francisco", "SF"], "end_location": ["Palo Alto"], "route_type": ["fastest"]}}}}], "error_type": "parallel_function_checker_no_order:cannot_find_match", "prompt": {"id": "parallel_89", "question": [[{"role": "user", "content": "Can you provide me with the fastest route from my home in San Francisco to my office in Palo Alto and then a scenic route from Palo Alto to the Golden Gate Bridge in San Francisco, and finally the fastest route back to my home from the Golden Gate Bridge?"}]], "function": [{"name": "get_directions", "description": "Retrieve directions from one location to another.", "parameters": {"type": "dict", "properties": {"start_location": {"type": "string", "description": "The starting point of the journey."}, "end_location": {"type": "string", "description": "The destination point of the journey."}, "route_type": {"type": "string", "description": "Type of route to use (e.g., fastest, scenic). Default is fastest.", "enum": ["fastest", "scenic"]}}, "required": ["start_location", "end_location"]}}]}, "model_result_raw": "\n[get_directions(start_location=\"San Francisco home\", end_location=\"Palo Alto office\", route_type=\"fastest\"), get_directions(start_location=\"Palo Alto office\", end_location=\"Golden Gate Bridge, San Francisco\", route_type=\"scenic\"), get_directions(start_location=\"Golden Gate Bridge\", end_location=\"San Francisco home\", route_type=\"fastest\")]", "model_result_decoded": [{"get_directions": {"start_location": "San Francisco home", "end_location": "Palo Alto office", "route_type": "fastest"}}, {"get_directions": {"start_location": "Palo Alto office", "end_location": "Golden Gate Bridge, San Francisco", "route_type": "scenic"}}, {"get_directions": {"start_location": "Golden Gate Bridge", "end_location": "San Francisco home", "route_type": "fastest"}}], "possible_answer": [{"get_directions": {"start_location": ["San Francisco", "SF"], "end_location": ["Palo Alto"], "route_type": ["fastest"]}}, {"get_directions": {"start_location": ["Palo Alto"], "end_location": ["Golden Gate Bridge in San Francisco", "Golden Gate Bridge, San Francisco", "Golden Gate Bridge"], "route_type": ["scenic"]}}, {"get_directions": {"start_location": ["Golden Gate Bridge in San Francisco", "Golden Gate Bridge, San Francisco", "Golden Gate Bridge"], "end_location": ["San Francisco", "SF"], "route_type": ["fastest"]}}]}
{"id": "parallel_108", "model_name": "D-CORE-14B", "test_category": "parallel", "valid": false, "error": ["Could not find a matching function among index [1] of model output for index 1 of possible answers.", {"Model Result Index 1": {"sub_error": ["Invalid value for parameter 'cell_type': 'muscle cell'. Expected one of ['muscle']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"biology.get_cell_info": {"cell_type": "muscle cell"}}, "possible_answer_item": {"biology.get_cell_info": {"cell_type": ["muscle"], "detailed": [false, ""]}}}}], "error_type": "parallel_function_checker_no_order:cannot_find_match", "prompt": {"id": "parallel_108", "question": [[{"role": "user", "content": "Can you provide a detailed description of the structure and functioning of a neuron cell and then compare it with a less detailed description of a muscle cell in the human body?"}]], "function": [{"name": "biology.get_cell_info", "description": "Retrieve information about the structure and functioning of a specified type of cell", "parameters": {"type": "dict", "properties": {"cell_type": {"type": "string", "description": "Type of cell you want information about"}, "detailed": {"type": "boolean", "description": "Indicate if you want a detailed description of the cell", "default": "false"}}, "required": ["cell_type"]}}]}, "model_result_raw": "\n[biology.get_cell_info(cell_type='neuron', detailed=True), biology.get_cell_info(cell_type='muscle cell')]", "model_result_decoded": [{"biology.get_cell_info": {"cell_type": "neuron", "detailed": true}}, {"biology.get_cell_info": {"cell_type": "muscle cell"}}], "possible_answer": [{"biology.get_cell_info": {"cell_type": ["neuron"], "detailed": [true]}}, {"biology.get_cell_info": {"cell_type": ["muscle"], "detailed": [false, ""]}}]}
{"id": "parallel_126", "model_name": "D-CORE-14B", "test_category": "parallel", "valid": false, "error": ["Could not find a matching function among index [0, 1] of model output for index 0 of possible answers.", {"Model Result Index 0": {"sub_error": ["Invalid value for parameter 'species': 'African Elephants'. Expected one of ['African Elephant']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"prediction.evolution": {"species": "African Elephants", "years": 5000, "model": "Darwin"}}, "possible_answer_item": {"prediction.evolution": {"species": ["African Elephant"], "years": [5000], "model": ["Darwin", ""]}}}}, {"Model Result Index 1": {"sub_error": ["Invalid value for parameter 'species': 'African Elephants'. Expected one of ['African Elephant']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"prediction.evolution": {"species": "African Elephants", "years": 5000, "model": "Lamarck"}}, "possible_answer_item": {"prediction.evolution": {"species": ["African Elephant"], "years": [5000], "model": ["Darwin", ""]}}}}], "error_type": "parallel_function_checker_no_order:cannot_find_match", "prompt": {"id": "parallel_126", "question": [[{"role": "user", "content": "What would be the predicted evolutionary rate for the African Elephant species over a period of 5000 years using the Darwin model, and how would this prediction change if we use the Lamarck model instead?"}]], "function": [{"name": "prediction.evolution", "description": "Predict the evolutionary rate for a specific species for a given timeframe.", "parameters": {"type": "dict", "properties": {"species": {"type": "string", "description": "The species that the evolution rate will be predicted for."}, "years": {"type": "integer", "description": "Number of years for the prediction."}, "model": {"type": "string", "description": "The model used to make the prediction, options: 'Darwin', 'Lamarck', default is 'Darwin'."}}, "required": ["species", "years"]}}]}, "model_result_raw": "\n[prediction.evolution(species=\"African Elephants\", years=5000, model=\"Darwin\"), prediction.evolution(species=\"African Elephants\", years=5000, model=\"Lamarck\")]", "model_result_decoded": [{"prediction.evolution": {"species": "African Elephants", "years": 5000, "model": "Darwin"}}, {"prediction.evolution": {"species": "African Elephants", "years": 5000, "model": "Lamarck"}}], "possible_answer": [{"prediction.evolution": {"species": ["African Elephant"], "years": [5000], "model": ["Darwin", ""]}}, {"prediction.evolution": {"species": ["African Elephant"], "years": [5000], "model": ["Lamarck"]}}]}
{"id": "parallel_151", "model_name": "D-CORE-14B", "test_category": "parallel", "valid": false, "error": ["Could not find a matching function among index [0, 1, 2] of model output for index 0 of possible answers.", {"Model Result Index 0": {"sub_error": ["Invalid value for parameter 'unit': 'meters'. Expected one of ['square meters', 'm^2', '']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"geometry.area_triangle": {"base": 15, "height": 20, "unit": "meters"}}, "possible_answer_item": {"geometry.area_triangle": {"base": [15], "height": [20], "unit": ["square meters", "m^2", ""]}}}}, {"Model Result Index 1": {"sub_error": ["Invalid value for parameter 'base': 25. Expected one of [15]."], "sub_error_type": "value_error:others", "model_output_item": {"geometry.area_triangle": {"base": 25, "height": 30, "unit": "feet"}}, "possible_answer_item": {"geometry.area_triangle": {"base": [15], "height": [20], "unit": ["square meters", "m^2", ""]}}}}, {"Model Result Index 2": {"sub_error": ["Invalid value for parameter 'base': 35. Expected one of [15]."], "sub_error_type": "value_error:others", "model_output_item": {"geometry.area_triangle": {"base": 35, "height": 40, "unit": "inches"}}, "possible_answer_item": {"geometry.area_triangle": {"base": [15], "height": [20], "unit": ["square meters", "m^2", ""]}}}}], "error_type": "parallel_function_checker_no_order:cannot_find_match", "prompt": {"id": "parallel_151", "question": [[{"role": "user", "content": "\"Can you help me calculate the total area of three different triangles? The first triangle has a base of 15 meters and a height of 20 meters. The second triangle has a base of 25 feet and a height of 30 feet. And the third triangle has a base of 35 inches and a height of 40 inches. I would like the area of each triangle in their respective units.\""}]], "function": [{"name": "geometry.area_triangle", "description": "Calculate the area of a triangle.", "parameters": {"type": "dict", "properties": {"base": {"type": "integer", "description": "The length of the base of the triangle."}, "height": {"type": "integer", "description": "The height of the triangle from the base."}, "unit": {"type": "string", "description": "The measurement unit for the area. Defaults to square meters."}}, "required": ["base", "height"]}}]}, "model_result_raw": "\n[geometry.area_triangle(base=15, height=20, unit='meters'), geometry.area_triangle(base=25, height=30, unit='feet'), geometry.area_triangle(base=35, height=40, unit='inches')]", "model_result_decoded": [{"geometry.area_triangle": {"base": 15, "height": 20, "unit": "meters"}}, {"geometry.area_triangle": {"base": 25, "height": 30, "unit": "feet"}}, {"geometry.area_triangle": {"base": 35, "height": 40, "unit": "inches"}}], "possible_answer": [{"geometry.area_triangle": {"base": [15], "height": [20], "unit": ["square meters", "m^2", ""]}}, {"geometry.area_triangle": {"base": [25], "height": [30], "unit": ["square feet", "ft^2"]}}, {"geometry.area_triangle": {"base": [35], "height": [40], "unit": ["square inches", "in^2"]}}]}
{"id": "parallel_158", "model_name": "D-CORE-14B", "test_category": "parallel", "valid": false, "error": ["Wrong number of functions."], "error_type": "parallel_function_checker_no_order:wrong_count", "prompt": {"id": "parallel_158", "question": [[{"role": "user", "content": "You are a data scientist working on a project that requires you to generate random numbers from a normal distribution. You need to generate four random numbers: two from a normal distribution with a mean of 5 and a standard deviation of 2, and two from a normal distribution with a mean of 10 and a standard deviation of 3. How can you use the 'random.normalvariate' function to achieve this?"}]], "function": [{"name": "random.normalvariate", "description": "Generates a random number from a normal distribution given the mean and standard deviation.", "parameters": {"type": "dict", "properties": {"mu": {"type": "integer", "description": "Mean of the normal distribution."}, "sigma": {"type": "integer", "description": "Standard deviation of the normal distribution."}}, "required": ["mu", "sigma"]}}]}, "model_result_raw": "\n[random.normalvariate(mu=5, sigma=2), random.normalvariate(mu=5, sigma=2), random.normalvariate(mu=10, sigma=3), random.normalvariate(mu=10, sigma=3)]", "model_result_decoded": [{"random.normalvariate": {"mu": 5, "sigma": 2}}, {"random.normalvariate": {"mu": 5, "sigma": 2}}, {"random.normalvariate": {"mu": 10, "sigma": 3}}, {"random.normalvariate": {"mu": 10, "sigma": 3}}], "possible_answer": [{"random.normalvariate": {"mu": [5], "sigma": [2]}}, {"random.normalvariate": {"mu": [10], "sigma": [3]}}]}
{"id": "parallel_185", "model_name": "D-CORE-14B", "test_category": "parallel", "valid": false, "error": ["Could not find a matching function among index [1, 2, 3] of model output for index 1 of possible answers.", {"Model Result Index 1": {"sub_error": ["Invalid value for parameter 'species': 'African Elephant'. Expected one of ['African Elephants']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"estimate_population": {"species": "African Elephant", "country": "Kenya", "year": 2021}}, "possible_answer_item": {"estimate_population": {"species": ["African Elephants"], "country": ["Kenya"], "year": [2021]}}}}, {"Model Result Index 2": {"sub_error": ["Invalid value for parameter 'species': 'Bengal Tiger'. Expected one of ['African Elephants']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"estimate_population": {"species": "Bengal Tiger", "country": "India", "year": 2023}}, "possible_answer_item": {"estimate_population": {"species": ["African Elephants"], "country": ["Kenya"], "year": [2021]}}}}, {"Model Result Index 3": {"sub_error": ["Invalid value for parameter 'species': 'African Elephant'. Expected one of ['African Elephants']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"estimate_population": {"species": "African Elephant", "country": "Kenya", "year": 2023}}, "possible_answer_item": {"estimate_population": {"species": ["African Elephants"], "country": ["Kenya"], "year": [2021]}}}}], "error_type": "parallel_function_checker_no_order:cannot_find_match", "prompt": {"id": "parallel_185", "question": [[{"role": "user", "content": "Can you estimate the population of Bengal Tigers in India for the year 2021, compare it with the estimated population of African Elephants in Kenya for the same year, and then estimate the population of both these species in their respective countries for year 2023?"}]], "function": [{"name": "estimate_population", "description": "Estimate the population of a particular species in a given country.", "parameters": {"type": "dict", "properties": {"species": {"type": "string", "description": "The species for which population needs to be estimated."}, "country": {"type": "string", "description": "The country where the species lives."}, "year": {"type": "integer", "description": "The year for which population estimate is sought. Default is 2020."}}, "required": ["species", "country"]}}]}, "model_result_raw": "\n[estimate_population(species=\"Bengal Tiger\", country=\"India\", year=2021), estimate_population(species=\"African Elephant\", country=\"Kenya\", year=2021), estimate_population(species=\"Bengal Tiger\", country=\"India\", year=2023), estimate_population(species=\"African Elephant\", country=\"Kenya\", year=2023)]", "model_result_decoded": [{"estimate_population": {"species": "Bengal Tiger", "country": "India", "year": 2021}}, {"estimate_population": {"species": "African Elephant", "country": "Kenya", "year": 2021}}, {"estimate_population": {"species": "Bengal Tiger", "country": "India", "year": 2023}}, {"estimate_population": {"species": "African Elephant", "country": "Kenya", "year": 2023}}], "possible_answer": [{"estimate_population": {"species": ["Bengal Tigers", "Bengal Tiger"], "country": ["India"], "year": [2021]}}, {"estimate_population": {"species": ["African Elephants"], "country": ["Kenya"], "year": [2021]}}, {"estimate_population": {"species": ["Bengal Tigers", "Bengal Tiger"], "country": ["India"], "year": [""]}}, {"estimate_population": {"species": ["African Elephants"], "country": ["Kenya"], "year": [2023]}}]}
{"id": "parallel_193", "model_name": "D-CORE-14B", "test_category": "parallel", "valid": false, "error": ["Could not find a matching function among index [0, 1] of model output for index 0 of possible answers.", {"Model Result Index 0": {"sub_error": ["Invalid value for parameter 'body': 'progress report'. Expected one of ['Dear John, The project is progressing as planned and we are on track to meet our deadlines. Best, Alex']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"send_email": {"to": "john.doe@example.com", "subject": "Project Update", "body": "progress report", "cc": "manager@example.com", "bcc": "hr@example.com"}}, "possible_answer_item": {"send_email": {"to": ["john.doe@example.com"], "subject": ["Project Update"], "body": ["Dear John, The project is progressing as planned and we are on track to meet our deadlines. Best, Alex"], "cc": ["manager@example.com"], "bcc": ["hr@example.com"]}}}}, {"Model Result Index 1": {"sub_error": ["Invalid value for parameter 'to': 'jane.doe@example.com'. Expected one of ['john.doe@example.com']. Case insensitive."], "sub_error_type": "value_error:string", "model_output_item": {"send_email": {"to": "jane.doe@example.com", "subject": "Meeting Reminder", "body": "meeting details", "cc": "assistant@example.com", "bcc": "hr@example.com"}}, "possible_answer_item": {"send_email": {"to": ["john.doe@example.com"], "subject": ["Project Update"], "body": ["Dear John, The project is progressing as planned and we are on track to meet our deadlines. Best, Alex"], "cc": ["manager@example.com"], "bcc": ["hr@example.com"]}}}}], "error_type": "parallel_function_checker_no_order:cannot_find_match", "prompt": {"id": "parallel_193", "question": [[{"role": "user", "content": "Can you send an email to my colleague at john.doe@example.com with the subject \"Project Update\" and the body content \"Dear John, The project is progressing as planned and we are on track to meet our deadlines. Best, Alex\", then carbon copy the email to my manager at manager@example.com and blind carbon copy it to the HR at hr@example.com? After that, can you send another email to my other colleague at jane.doe@example.com with the subject \"Meeting Reminder\" and the body content \"Dear Jane, This is a reminder for our meeting scheduled for tomorrow at 10 AM. Best, Alex\", and carbon copy it to my assistant at assistant@example.com and blind carbon copy it to the HR at hr@example.com?"}]], "function": [{"name": "send_email", "description": "Send an email to the specified email address.", "parameters": {"type": "dict", "properties": {"to": {"type": "string", "description": "The email address to send to."}, "subject": {"type": "string", "description": "The subject of the email."}, "body": {"type": "string", "description": "The body content of the email."}, "cc": {"type": "string", "description": "The email address to carbon copy. default is ''."}, "bcc": {"type": "string", "description": "The email address to blind carbon copy. the value is set to '' for default."}}, "required": ["to", "subject", "body"]}}]}, "model_result_raw": "\n[send_email(to=\"john.doe@example.com\", subject=\"Project Update\", body=\"progress report\", cc=\"manager@example.com\", bcc=\"hr@example.com\"), send_email(to=\"jane.doe@example.com\", subject=\"Meeting Reminder\", body=\"meeting details\", cc=\"assistant@example.com\", bcc=\"hr@example.com\")]", "model_result_decoded": [{"send_email": {"to": "john.doe@example.com", "subject": "Project Update", "body": "progress report", "cc": "manager@example.com", "bcc": "hr@example.com"}}, {"send_email": {"to": "jane.doe@example.com", "subject": "Meeting Reminder", "body": "meeting details", "cc": "assistant@example.com", "bcc": "hr@example.com"}}], "possible_answer": [{"send_email": {"to": ["john.doe@example.com"], "subject": ["Project Update"], "body": ["Dear John, The project is progressing as planned and we are on track to meet our deadlines. Best, Alex"], "cc": ["manager@example.com"], "bcc": ["hr@example.com"]}}, {"send_email": {"to": ["jane.doe@example.com"], "subject": ["Meeting Reminder"], "body": ["Dear Jane, This is a reminder for our meeting scheduled for tomorrow at 10 AM. Best, Alex"], "cc": ["assistant@example.com"], "bcc": ["hr@example.com"]}}]}