methodA,methodB,isGolden,originalName,answerValue,answerer,wasDiscarded,modelProbability,answeredAt
alpaca-13b,gpt-3.5-turbo,false,mtbench-81,B,author_2,,,Fri Nov 08 2024 20:41:57 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-81,B,author_2,,,Mon Nov 11 2024 07:00:44 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-81,B,expert_17,,,Sat Jan 20 2024 13:28:50 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-81,B,expert_17,,,Sun Apr 14 2024 12:24:10 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-81,B,expert_0,,,Sat Nov 16 2024 00:20:21 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-81,Tie,expert_0,,,Wed Nov 27 2024 21:22:06 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-81,A,expert_37,,,Sat Aug 24 2024 10:37:25 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-81,A,expert_37,,,Sat Mar 23 2024 12:59:23 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-81,A,expert_27,,,Sun Dec 01 2024 09:11:46 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-81,Tie,expert_27,,,Sat May 25 2024 20:40:00 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-81,A,expert_24,,,Sat Oct 12 2024 12:08:59 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-81,A,expert_24,,,Sun Apr 28 2024 07:21:12 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-81,A,expert_45,,,Wed Dec 18 2024 03:31:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-81,A,expert_45,,,Thu Feb 08 2024 02:39:58 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-81,Tie,expert_11,,,Sun Sep 15 2024 13:24:53 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-81,A,expert_11,,,Sun Jun 02 2024 14:57:08 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-81,Tie,expert_24,,,Sat Jan 13 2024 21:33:18 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-81,A,expert_24,,,Mon May 20 2024 16:50:09 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-81,A,author_3,,,Wed Jan 03 2024 02:34:41 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-81,A,author_3,,,Mon Jan 15 2024 02:25:26 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-81,A,expert_43,,,Fri Mar 15 2024 23:55:01 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-81,A,expert_43,,,Thu Oct 03 2024 12:43:44 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-81,A,expert_3,,,Wed Jul 24 2024 04:21:30 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-81,A,expert_3,,,Fri Feb 16 2024 17:59:56 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-81,B,expert_0,,,Fri Feb 09 2024 01:12:30 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-81,Tie,expert_0,,,Mon Jan 08 2024 16:35:21 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-81,A,expert_10,,,Thu May 02 2024 09:51:11 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-81,A,expert_10,,,Mon Mar 04 2024 08:43:17 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-82,B,expert_46,,,Mon Apr 01 2024 11:58:18 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-82,B,expert_46,,,Sun Sep 01 2024 02:51:09 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-82,Tie,expert_46,,,Tue Oct 01 2024 19:24:43 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-82,A,expert_46,,,Sat Oct 19 2024 11:40:03 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-82,B,author_3,,,Thu Sep 12 2024 05:12:38 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-82,B,author_3,,,Mon Aug 19 2024 07:28:52 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-82,A,expert_31,,,Tue May 07 2024 14:31:00 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-82,A,expert_31,,,Wed Oct 02 2024 00:48:10 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-82,A,expert_20,,,Sat Jun 15 2024 21:54:24 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-82,A,expert_20,,,Thu Jul 11 2024 23:50:29 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-82,A,expert_28,,,Sun Mar 17 2024 12:18:31 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-82,A,expert_28,,,Sat Oct 19 2024 08:25:18 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-82,A,expert_40,,,Sun Sep 22 2024 02:39:59 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-82,B,expert_40,,,Mon Dec 16 2024 05:55:18 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-82,B,expert_24,,,Wed Mar 06 2024 10:15:37 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-82,Tie,expert_24,,,Mon Apr 22 2024 19:22:48 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-82,B,expert_26,,,Tue Dec 17 2024 16:38:50 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-82,B,expert_26,,,Fri Feb 16 2024 13:09:23 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-82,Tie,expert_24,,,Mon Mar 25 2024 11:04:11 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-82,B,expert_24,,,Wed Dec 04 2024 18:10:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-82,A,expert_46,,,Mon Dec 23 2024 13:21:27 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-82,B,expert_46,,,Tue Mar 26 2024 19:03:56 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-82,B,author_0,,,Sun Apr 14 2024 11:12:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-82,A,author_0,,,Mon Dec 02 2024 23:28:05 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-82,A,author_4,,,Wed Nov 06 2024 16:12:50 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-82,A,author_4,,,Sat Jul 27 2024 03:34:53 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-82,B,expert_28,,,Sun Nov 17 2024 17:35:06 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-82,A,expert_28,,,Wed Apr 10 2024 19:50:21 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-82,A,author_4,,,Sat Apr 27 2024 11:23:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-82,B,author_4,,,Mon May 20 2024 19:53:09 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-82,A,expert_2,,,Wed Jan 10 2024 15:38:25 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-82,B,expert_2,,,Tue Apr 02 2024 14:59:51 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-82,B,expert_20,,,Sun Aug 04 2024 07:25:10 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-82,B,expert_20,,,Fri Sep 06 2024 11:17:51 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-82,Tie,expert_24,,,Wed Jun 26 2024 11:43:01 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-82,Tie,expert_24,,,Fri Aug 09 2024 14:59:52 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-82,A,author_5,,,Thu Mar 21 2024 18:10:02 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-82,A,author_5,,,Sat Jul 20 2024 14:11:07 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-82,B,expert_2,,,Tue Jul 02 2024 06:09:02 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-82,B,expert_2,,,Thu Nov 21 2024 09:19:39 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-82,B,expert_50,,,Tue Oct 15 2024 06:47:13 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-82,B,expert_50,,,Thu May 16 2024 15:37:19 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-82,B,expert_57,,,Wed Feb 07 2024 14:31:40 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-82,A,expert_57,,,Tue Aug 13 2024 03:29:34 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-82,B,author_5,,,Mon Apr 01 2024 06:07:03 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-82,B,author_5,,,Tue Dec 10 2024 21:14:13 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-82,B,expert_48,,,Tue Aug 20 2024 18:21:47 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-82,B,expert_48,,,Fri Jul 12 2024 04:34:44 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-82,B,expert_51,,,Sat Mar 23 2024 10:56:50 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-82,B,expert_51,,,Tue Feb 06 2024 06:00:11 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-82,A,expert_21,,,Mon Jun 24 2024 07:20:30 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-82,B,expert_21,,,Wed Feb 14 2024 17:12:43 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-82,B,expert_50,,,Thu Jul 18 2024 17:26:20 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-82,A,expert_50,,,Wed Nov 27 2024 11:29:40 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-82,B,expert_11,,,Thu Jun 27 2024 18:03:49 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-82,B,expert_11,,,Sun Aug 11 2024 01:51:09 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-82,A,expert_45,,,Mon May 13 2024 04:15:49 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-82,A,expert_45,,,Tue Jun 18 2024 00:48:29 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-83,B,expert_1,,,Mon Apr 22 2024 03:24:29 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-83,B,expert_1,,,Thu Jul 04 2024 22:46:11 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-83,A,expert_12,,,Sat Sep 28 2024 16:30:59 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-83,A,expert_12,,,Mon Jan 08 2024 17:13:00 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-83,A,expert_23,,,Fri Nov 01 2024 14:02:41 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-83,B,expert_23,,,Tue Mar 26 2024 17:18:02 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-83,A,author_0,,,Sun Dec 01 2024 07:22:20 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-83,A,author_0,,,Sun May 12 2024 07:59:59 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-83,B,author_5,,,Mon Oct 14 2024 00:54:06 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-83,B,author_5,,,Wed Feb 21 2024 13:29:13 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-83,Tie,expert_42,,,Fri Jun 14 2024 18:51:20 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-83,A,expert_42,,,Wed Mar 27 2024 22:36:31 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-83,A,expert_8,,,Thu Jun 20 2024 10:40:12 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-83,A,expert_8,,,Sat Dec 14 2024 09:10:57 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-83,B,expert_36,,,Mon Sep 16 2024 19:19:24 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-83,A,expert_36,,,Tue May 07 2024 12:29:50 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-83,B,expert_51,,,Tue Dec 10 2024 16:58:54 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-83,B,expert_35,,,Fri Aug 23 2024 11:45:46 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-83,Tie,expert_35,,,Sat Sep 21 2024 13:19:43 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-83,B,expert_21,,,Sat Feb 17 2024 10:56:20 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-83,Tie,expert_21,,,Tue Mar 05 2024 08:30:09 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-83,B,expert_9,,,Fri Dec 13 2024 19:28:17 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-83,B,expert_9,,,Sun Nov 03 2024 11:43:32 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-83,B,expert_32,,,Sat Jan 27 2024 18:04:08 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-83,B,expert_32,,,Fri May 17 2024 21:43:15 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-83,Tie,author_4,,,Sat Jan 27 2024 00:27:50 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-83,B,author_4,,,Tue Dec 03 2024 02:40:23 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-83,Tie,expert_34,,,Mon Mar 04 2024 15:47:59 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-83,B,expert_34,,,Thu Sep 26 2024 03:03:30 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-83,A,expert_46,,,Mon May 20 2024 14:10:23 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-83,B,expert_46,,,Wed Aug 21 2024 12:34:05 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-83,A,expert_20,,,Tue Jul 02 2024 12:15:37 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-83,A,expert_20,,,Fri Jun 21 2024 19:57:44 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-84,B,expert_1,,,Fri May 03 2024 14:12:00 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-84,B,expert_1,,,Wed Dec 25 2024 23:01:22 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-84,A,expert_6,,,Fri Sep 06 2024 21:44:30 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-84,B,expert_6,,,Fri Jun 21 2024 02:16:35 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-84,A,expert_22,,,Mon Jan 08 2024 04:36:01 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-84,B,expert_22,,,Tue Mar 26 2024 01:58:57 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-84,B,expert_45,,,Sun Sep 22 2024 01:21:46 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-84,B,expert_45,,,Sun Mar 17 2024 10:08:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-84,A,author_4,,,Thu Mar 07 2024 14:19:01 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-84,A,author_4,,,Sat Jul 27 2024 16:27:17 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-84,Tie,expert_24,,,Sun Mar 03 2024 13:50:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-84,A,expert_24,,,Sun May 12 2024 17:39:04 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-84,B,expert_47,,,Sat Apr 27 2024 09:03:21 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-84,A,expert_47,,,Thu Dec 19 2024 14:36:17 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-84,Tie,expert_24,,,Fri Feb 23 2024 19:45:20 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-84,Tie,expert_24,,,Fri Dec 20 2024 00:12:44 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-84,B,author_4,,,Tue Dec 10 2024 11:22:35 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-84,Tie,author_4,,,Fri Nov 01 2024 15:24:14 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-84,A,expert_0,,,Thu Jul 18 2024 12:42:19 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-84,Tie,expert_0,,,Tue Jul 16 2024 05:58:09 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-84,A,expert_8,,,Sun Oct 13 2024 20:39:07 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-84,B,expert_8,,,Tue Jan 16 2024 18:34:56 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-84,A,author_2,,,Fri Nov 22 2024 09:38:16 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-84,B,author_2,,,Thu Dec 19 2024 19:06:10 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-84,B,expert_43,,,Mon Feb 05 2024 04:01:26 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-84,B,expert_43,,,Fri Jan 19 2024 07:13:30 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-85,B,author_5,,,Fri Apr 12 2024 02:00:31 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-85,B,author_5,,,Sun Feb 11 2024 07:24:33 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-85,B,expert_8,,,Mon Jun 24 2024 00:44:33 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-85,B,expert_8,,,Mon Oct 28 2024 06:55:20 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-85,A,expert_15,,,Mon Oct 21 2024 01:42:47 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-85,A,expert_15,,,Mon May 27 2024 02:20:25 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-85,B,expert_22,,,Sun Jul 14 2024 18:41:26 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-85,B,expert_22,,,Sun Jan 21 2024 01:09:29 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-85,A,expert_11,,,Tue May 07 2024 08:14:48 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-85,A,expert_11,,,Wed Dec 25 2024 02:56:18 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-85,A,expert_16,,,Tue Jan 23 2024 13:13:19 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-85,A,expert_16,,,Wed Aug 14 2024 05:15:54 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-85,Tie,author_0,,,Fri May 24 2024 02:25:06 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-85,Tie,author_0,,,Mon Sep 23 2024 06:35:08 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-85,A,expert_56,,,Mon Oct 28 2024 10:57:28 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-85,B,expert_56,,,Fri Jan 26 2024 20:42:20 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-85,A,expert_12,,,Sat Jul 20 2024 08:06:44 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-85,Tie,expert_12,,,Sun Mar 24 2024 22:49:07 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-85,A,expert_24,,,Thu Nov 21 2024 21:17:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-85,B,expert_24,,,Fri Oct 11 2024 19:47:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-85,B,expert_36,,,Tue Aug 06 2024 12:16:33 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-85,B,expert_36,,,Sat Aug 17 2024 08:56:06 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-85,Tie,expert_24,,,Sat Oct 12 2024 23:33:44 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-85,B,expert_24,,,Tue Mar 26 2024 17:27:48 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-85,A,expert_50,,,Wed Aug 07 2024 18:05:42 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-85,B,expert_50,,,Wed Oct 16 2024 10:15:20 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-85,A,expert_42,,,Wed Jun 26 2024 12:24:19 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-85,A,expert_42,,,Thu May 23 2024 09:53:50 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-85,A,expert_42,,,Sat Aug 03 2024 08:59:29 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-85,A,expert_42,,,Thu Feb 08 2024 19:58:05 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-85,A,expert_3,,,Sun May 19 2024 00:54:48 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-85,A,expert_3,,,Sat Feb 24 2024 06:08:06 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-85,B,expert_45,,,Thu Nov 28 2024 09:26:55 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-85,A,expert_45,,,Wed Dec 18 2024 21:24:04 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-85,A,expert_1,,,Thu Nov 28 2024 14:42:10 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-85,Tie,expert_1,,,Mon Jul 15 2024 22:23:45 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-85,Tie,expert_9,,,Sun May 26 2024 06:42:12 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-85,A,expert_9,,,Wed Aug 14 2024 01:23:45 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-85,B,expert_24,,,Wed Jun 19 2024 03:21:24 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-85,B,expert_24,,,Sat Nov 23 2024 17:30:46 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-85,A,expert_17,,,Sat May 25 2024 06:48:52 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-85,Tie,expert_17,,,Thu Jul 04 2024 10:57:36 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-85,A,author_3,,,Fri May 17 2024 08:30:28 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-85,Tie,author_3,,,Sat Apr 13 2024 01:02:44 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-85,Tie,expert_7,,,Sun Jan 14 2024 22:03:53 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-85,B,expert_7,,,Tue Oct 15 2024 10:13:14 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-85,Tie,author_0,,,Wed Jul 24 2024 19:10:54 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-85,Tie,author_0,,,Mon Jan 15 2024 12:20:27 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-85,B,expert_24,,,Sat Dec 14 2024 18:36:28 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-85,B,expert_24,,,Fri Apr 12 2024 15:52:10 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-85,A,expert_26,,,Thu Nov 07 2024 00:01:22 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-85,A,expert_26,,,Fri Feb 16 2024 02:39:49 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-86,Tie,expert_13,,,Sat Mar 23 2024 03:40:51 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-86,Tie,expert_13,,,Mon Dec 23 2024 15:02:42 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-86,B,expert_34,,,Wed Jun 12 2024 16:30:22 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-86,A,expert_34,,,Sun Jun 16 2024 14:05:34 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-86,A,expert_42,,,Sun Sep 22 2024 19:57:29 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-86,A,expert_42,,,Sun Feb 11 2024 04:45:00 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-86,Tie,expert_24,,,Tue Dec 03 2024 16:57:33 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-86,B,expert_24,,,Wed Jul 03 2024 10:21:17 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-86,Tie,expert_19,,,Sun Jun 02 2024 16:38:42 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-86,A,expert_19,,,Wed Nov 06 2024 05:49:55 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-86,A,author_0,,,Fri Sep 13 2024 12:44:16 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-86,A,author_0,,,Tue Sep 10 2024 05:55:31 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-86,A,expert_24,,,Thu Mar 21 2024 19:27:12 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-86,A,expert_24,,,Wed Jun 26 2024 18:05:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-86,A,expert_6,,,Mon Sep 16 2024 12:39:10 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-86,A,expert_6,,,Tue Jan 09 2024 04:27:04 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-86,B,expert_1,,,Wed Aug 21 2024 18:29:03 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-86,A,expert_1,,,Fri Nov 08 2024 22:41:53 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-86,A,expert_5,,,Wed Feb 07 2024 13:43:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-86,A,expert_5,,,Sun Nov 17 2024 05:59:01 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-86,A,expert_50,,,Fri Sep 13 2024 08:31:17 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-86,A,expert_50,,,Mon Jul 01 2024 16:30:55 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-86,A,expert_27,,,Tue Jan 09 2024 05:58:08 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-86,A,expert_27,,,Sun Jun 16 2024 13:10:47 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-86,A,expert_6,,,Wed Jun 05 2024 16:26:57 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-86,A,expert_6,,,Fri Sep 20 2024 03:49:04 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-86,A,expert_56,,,Sat Jan 13 2024 22:48:08 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-86,B,expert_56,,,Thu Jul 04 2024 13:54:38 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-86,B,expert_49,,,Wed Mar 20 2024 00:09:00 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-86,B,expert_49,,,Wed Jan 10 2024 20:20:15 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-86,Tie,expert_9,,,Wed Jun 05 2024 13:03:59 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-86,B,expert_9,,,Fri Dec 06 2024 13:42:18 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-86,A,expert_57,,,Wed Feb 14 2024 02:34:50 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-86,Tie,expert_57,,,Tue Nov 26 2024 04:49:02 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-86,Tie,expert_0,,,Wed May 22 2024 08:46:20 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-87,A,expert_42,,,Fri Apr 26 2024 00:39:24 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-87,A,expert_42,,,Sun Jul 21 2024 20:45:02 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-87,B,expert_29,,,Fri Feb 23 2024 16:49:22 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-87,B,expert_29,,,Mon Feb 26 2024 05:56:51 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-87,A,author_0,,,Sun Nov 24 2024 10:59:05 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-87,A,author_0,,,Tue Dec 03 2024 15:49:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-87,Tie,expert_31,,,Sun Sep 22 2024 11:39:18 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-87,Tie,expert_31,,,Tue Jul 23 2024 08:20:02 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-87,B,author_4,,,Thu May 09 2024 03:09:36 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-87,Tie,author_4,,,Fri Nov 08 2024 19:13:43 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-87,Tie,expert_13,,,Wed Nov 27 2024 12:58:53 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-87,A,expert_13,,,Mon Dec 16 2024 01:24:54 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-87,Tie,expert_24,,,Fri Mar 15 2024 21:30:45 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-87,A,expert_24,,,Tue Nov 19 2024 02:42:26 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-87,A,expert_32,,,Wed Jun 05 2024 09:06:04 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-87,A,expert_32,,,Sun Feb 11 2024 02:56:07 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-87,Tie,expert_24,,,Mon Sep 23 2024 00:39:24 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-87,B,expert_24,,,Mon Apr 15 2024 03:30:12 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-87,B,author_4,,,Tue Dec 24 2024 15:25:20 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-87,B,author_4,,,Tue May 07 2024 05:22:18 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-87,B,expert_21,,,Tue Jun 18 2024 17:18:19 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-87,Tie,expert_21,,,Tue Dec 17 2024 07:58:49 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-87,A,expert_22,,,Sat Oct 19 2024 06:22:42 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-87,B,expert_22,,,Sun Jun 02 2024 03:32:48 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-87,A,expert_20,,,Mon Jul 15 2024 17:41:02 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-87,A,expert_20,,,Thu Apr 11 2024 16:53:59 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-87,Tie,expert_9,,,Mon Dec 02 2024 14:08:24 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-87,B,expert_9,,,Fri Jul 12 2024 21:10:06 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-87,A,expert_0,,,Tue Feb 13 2024 13:00:37 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-87,A,expert_0,,,Thu Dec 19 2024 02:11:20 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-87,A,expert_4,,,Sun Jan 14 2024 22:51:09 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-87,A,expert_4,,,Sun Apr 07 2024 23:00:37 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-87,A,expert_51,,,Wed Jun 19 2024 11:10:34 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-87,A,expert_51,,,Mon Jun 17 2024 04:24:12 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-88,B,expert_25,,,Thu Oct 24 2024 03:48:40 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-88,A,expert_25,,,Sun Mar 24 2024 02:43:43 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-88,A,expert_37,,,Tue Oct 08 2024 03:43:43 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-88,A,expert_37,,,Mon Apr 08 2024 13:27:39 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-88,A,expert_36,,,Thu May 09 2024 12:46:09 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-88,A,expert_36,,,Tue Sep 03 2024 17:00:38 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-88,A,expert_37,,,Sun Oct 06 2024 18:21:01 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-88,A,expert_37,,,Fri Jan 19 2024 04:01:33 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-88,Tie,author_4,,,Sun Jun 02 2024 09:53:37 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-88,Tie,author_4,,,Fri Nov 15 2024 10:36:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-88,B,expert_12,,,Sat Apr 06 2024 07:58:10 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-88,A,expert_12,,,Mon Aug 19 2024 15:36:39 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-88,Tie,expert_55,,,Tue Nov 05 2024 00:28:58 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-88,B,expert_55,,,Fri Jun 21 2024 06:05:06 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-88,A,expert_11,,,Fri Jun 14 2024 00:06:09 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-88,A,expert_11,,,Mon Mar 25 2024 04:01:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-88,A,expert_15,,,Fri Mar 08 2024 23:37:12 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-88,B,expert_15,,,Sat Apr 06 2024 15:52:52 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-88,B,expert_10,,,Mon Feb 19 2024 11:06:44 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-88,A,expert_10,,,Sun Sep 22 2024 09:31:20 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-88,B,expert_26,,,Sat Jun 01 2024 07:56:46 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-88,A,expert_26,,,Tue Dec 24 2024 11:47:26 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-88,B,author_2,,,Sun Jul 28 2024 13:51:19 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-88,B,author_2,,,Tue Apr 23 2024 16:33:21 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-88,B,expert_11,,,Fri Jul 12 2024 14:52:31 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-88,B,expert_11,,,Mon Aug 19 2024 20:36:24 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-88,B,expert_15,,,Mon Feb 19 2024 14:23:19 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-88,A,expert_15,,,Tue May 14 2024 08:32:50 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-88,B,author_3,,,Sat Oct 26 2024 02:22:39 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-88,B,author_3,,,Sun Jun 16 2024 17:17:33 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-89,B,author_4,,,Sat Jun 01 2024 12:23:32 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-89,B,author_4,,,Thu Apr 25 2024 16:25:05 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-89,B,expert_9,,,Mon Oct 21 2024 02:54:07 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-89,A,expert_9,,,Mon Nov 04 2024 06:32:11 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-89,Tie,expert_1,,,Wed Aug 28 2024 15:14:06 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-89,A,expert_1,,,Sun Sep 15 2024 16:24:48 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-89,A,expert_16,,,Sun Jun 23 2024 16:16:05 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-89,B,expert_16,,,Wed Feb 14 2024 22:19:07 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-89,B,expert_8,,,Wed Jul 10 2024 10:06:10 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-89,A,expert_8,,,Tue Nov 05 2024 17:33:51 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-89,A,expert_1,,,Wed May 15 2024 10:30:55 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-89,A,expert_1,,,Sun Oct 06 2024 12:58:54 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-89,A,expert_20,,,Fri Feb 23 2024 23:21:49 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-89,B,expert_20,,,Sat Mar 09 2024 09:16:54 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-89,A,expert_37,,,Mon Aug 26 2024 22:53:40 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-89,A,expert_37,,,Mon Jan 01 2024 14:24:01 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-89,B,author_4,,,Fri Feb 09 2024 02:35:51 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-89,B,author_4,,,Fri Sep 27 2024 07:24:50 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-89,B,expert_26,,,Wed Mar 27 2024 19:36:35 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-89,A,expert_26,,,Thu Jul 25 2024 14:21:44 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-89,B,author_4,,,Thu Jan 04 2024 19:48:17 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-89,A,author_4,,,Tue Jan 09 2024 19:33:18 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-89,A,author_4,,,Sun Dec 01 2024 09:23:45 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-89,A,author_4,,,Fri Sep 13 2024 04:36:51 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-89,B,expert_32,,,Fri Feb 16 2024 14:10:06 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-89,B,expert_32,,,Sun May 26 2024 17:14:42 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-89,A,expert_10,,,Fri Apr 19 2024 03:32:38 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-89,B,expert_10,,,Sun Sep 22 2024 07:55:08 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-89,B,expert_50,,,Sun Aug 18 2024 03:22:31 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-89,B,expert_50,,,Wed Aug 21 2024 05:34:41 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-89,B,expert_9,,,Tue Oct 22 2024 23:36:51 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-89,B,expert_9,,,Sun Oct 20 2024 01:44:54 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-89,A,expert_56,,,Fri Jun 21 2024 17:09:44 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-89,Tie,expert_56,,,Mon Sep 02 2024 05:44:28 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-89,A,expert_14,,,Tue Jun 04 2024 21:41:07 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-89,B,expert_14,,,Wed Jan 17 2024 18:46:32 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-90,B,author_4,,,Fri Apr 26 2024 15:20:24 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-90,B,author_4,,,Sat Jan 20 2024 10:00:36 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-90,B,expert_31,,,Wed Dec 11 2024 14:20:21 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-90,Tie,expert_31,,,Wed Dec 04 2024 03:42:55 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-90,B,expert_50,,,Sun Jun 23 2024 19:41:08 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-90,B,expert_50,,,Sun Mar 03 2024 12:05:34 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-90,B,expert_9,,,Tue Jun 11 2024 06:26:32 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-90,B,expert_9,,,Thu Feb 01 2024 09:24:48 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-90,B,expert_7,,,Thu Dec 12 2024 08:32:25 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-90,A,expert_7,,,Sat Nov 09 2024 08:27:37 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-90,Tie,expert_0,,,Tue Aug 13 2024 12:10:47 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-90,A,expert_0,,,Fri Mar 01 2024 11:05:57 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-90,B,expert_11,,,Fri Aug 16 2024 17:21:38 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-90,A,expert_11,,,Wed Nov 06 2024 22:08:11 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-90,B,expert_0,,,Sun Mar 24 2024 14:46:47 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-90,Tie,expert_0,,,Sun Dec 22 2024 08:47:27 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-90,B,expert_4,,,Mon Sep 02 2024 11:11:58 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-90,B,expert_4,,,Thu Jun 20 2024 01:50:07 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-90,A,author_3,,,Mon Jul 15 2024 22:00:55 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-90,A,author_3,,,Sat May 11 2024 14:34:37 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-90,A,expert_40,,,Thu Sep 05 2024 21:47:56 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-90,A,expert_40,,,Thu Mar 28 2024 04:34:02 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-90,Tie,author_0,,,Wed Dec 18 2024 03:31:04 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-90,Tie,author_0,,,Wed Jun 26 2024 12:09:01 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-90,A,author_4,,,Thu Jul 04 2024 14:43:51 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-90,A,author_4,,,Tue Aug 13 2024 04:45:25 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-90,A,expert_48,,,Mon Dec 16 2024 23:49:06 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-90,A,expert_48,,,Fri Apr 05 2024 06:45:45 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-90,Tie,expert_21,,,Sat Dec 14 2024 19:31:32 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-90,B,expert_21,,,Fri Aug 16 2024 08:00:25 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-90,B,expert_43,,,Wed Feb 21 2024 02:02:51 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-90,A,expert_43,,,Wed Jun 05 2024 20:18:16 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-90,B,expert_27,,,Sun Jan 28 2024 12:28:04 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-90,B,expert_27,,,Wed Jun 12 2024 02:21:58 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-90,B,expert_0,,,Tue Sep 03 2024 03:33:16 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-90,B,expert_0,,,Sat Sep 14 2024 08:02:27 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-90,B,expert_0,,,Fri Feb 09 2024 09:23:05 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-90,B,expert_0,,,Tue Apr 09 2024 02:31:32 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-90,B,expert_28,,,Thu Feb 22 2024 23:59:53 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-90,B,expert_28,,,Sun Jan 28 2024 00:32:44 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-90,A,expert_50,,,Sun Mar 24 2024 21:22:05 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-90,B,expert_50,,,Mon Jun 10 2024 11:20:35 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-90,Tie,expert_32,,,Tue Jun 18 2024 21:41:28 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-90,Tie,expert_32,,,Sun Jul 28 2024 20:23:03 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-90,B,expert_19,,,Tue Dec 17 2024 11:39:41 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-90,B,expert_19,,,Tue Feb 06 2024 11:41:56 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-91,B,author_2,,,Sun Jan 07 2024 01:29:34 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-91,B,author_2,,,Sun Dec 08 2024 04:59:51 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-91,A,expert_35,,,Sat Feb 24 2024 11:28:36 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-91,A,expert_35,,,Mon Jun 17 2024 11:51:06 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-91,B,expert_40,,,Sat May 11 2024 03:58:39 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-91,B,expert_40,,,Sat Jul 20 2024 14:33:46 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-91,B,expert_13,,,Mon Feb 26 2024 11:17:12 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-91,A,expert_13,,,Sat Aug 03 2024 12:56:30 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-91,A,expert_39,,,Mon Dec 16 2024 23:50:36 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-91,B,expert_39,,,Wed Apr 24 2024 11:19:14 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-91,A,expert_14,,,Tue Mar 19 2024 03:33:04 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-91,A,expert_14,,,Mon Dec 16 2024 14:13:39 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-91,A,expert_17,,,Mon Nov 11 2024 13:15:14 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-91,B,expert_17,,,Fri May 03 2024 03:20:34 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-91,A,expert_23,,,Thu Feb 08 2024 11:00:36 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-91,A,expert_23,,,Fri Apr 12 2024 17:16:04 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-91,A,expert_3,,,Tue Oct 15 2024 23:40:50 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-91,A,expert_3,,,Mon Aug 05 2024 20:25:39 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-91,A,expert_43,,,Tue Feb 06 2024 05:32:47 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-91,A,expert_43,,,Sat Apr 06 2024 07:30:08 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-91,Tie,author_4,,,Tue Oct 01 2024 02:20:26 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-91,A,author_4,,,Sat Aug 10 2024 21:27:38 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-91,B,expert_0,,,Thu Aug 08 2024 21:16:26 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-91,A,expert_0,,,Sun Aug 18 2024 22:11:17 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-91,B,expert_2,,,Mon Apr 15 2024 09:24:17 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-91,Tie,expert_2,,,Tue Dec 03 2024 14:19:52 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-91,Tie,author_4,,,Thu Sep 26 2024 02:03:12 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-91,Tie,author_4,,,Sun Aug 25 2024 23:43:05 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-91,Tie,expert_18,,,Fri Sep 20 2024 12:19:47 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-91,A,expert_18,,,Sat Jul 06 2024 11:42:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-91,Tie,expert_7,,,Fri Jan 05 2024 10:52:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-91,Tie,expert_7,,,Thu Oct 10 2024 22:44:06 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-91,A,author_0,,,Mon Aug 12 2024 15:51:00 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-91,A,author_0,,,Tue Aug 06 2024 20:21:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-91,B,author_4,,,Thu Jun 20 2024 02:12:02 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-91,A,author_4,,,Sun Jul 14 2024 09:12:50 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-91,B,expert_24,,,Tue May 07 2024 19:39:17 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-91,A,expert_24,,,Sat May 11 2024 12:44:47 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-91,A,expert_29,,,Tue Oct 01 2024 07:05:44 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-91,A,expert_29,,,Tue Jun 04 2024 13:16:13 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-91,Tie,expert_2,,,Sun Feb 04 2024 05:56:59 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-91,Tie,expert_2,,,Wed Apr 03 2024 10:03:06 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-91,Tie,expert_31,,,Wed Dec 11 2024 17:21:01 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-91,A,expert_31,,,Thu Feb 15 2024 12:32:33 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-91,B,author_4,,,Mon Feb 12 2024 10:10:19 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-91,B,author_4,,,Fri Oct 25 2024 09:54:25 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-91,B,expert_26,,,Sat Aug 17 2024 02:53:19 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-91,B,expert_26,,,Thu Mar 14 2024 20:50:34 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-91,B,expert_35,,,Wed Oct 16 2024 08:10:23 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-91,B,expert_35,,,Mon Aug 05 2024 15:48:42 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-91,B,expert_4,,,Tue Sep 03 2024 16:15:37 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-91,B,expert_4,,,Wed Jan 17 2024 22:39:18 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-91,Tie,author_0,,,Sun Jul 14 2024 14:55:07 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-91,B,author_0,,,Thu Jul 18 2024 04:34:06 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-91,Tie,expert_0,,,Sat Dec 21 2024 11:50:13 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-91,B,expert_0,,,Mon Apr 08 2024 15:38:59 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-91,A,expert_40,,,Thu May 02 2024 14:33:42 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-91,A,expert_40,,,Fri Feb 16 2024 13:59:32 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-92,B,expert_0,,,Sat Feb 03 2024 17:39:10 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-92,B,expert_0,,,Sun Jun 02 2024 14:12:12 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-92,B,expert_29,,,Mon Nov 11 2024 10:23:39 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-92,Tie,expert_29,,,Wed Oct 16 2024 03:28:10 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-92,B,expert_21,,,Thu Sep 12 2024 00:05:40 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-92,Tie,expert_21,,,Tue Oct 08 2024 22:15:39 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-92,B,author_5,,,Sun Oct 06 2024 04:47:21 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-92,A,author_5,,,Mon Apr 08 2024 18:38:32 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-92,B,expert_50,,,Mon Jan 08 2024 21:02:03 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-92,B,expert_50,,,Sat Nov 09 2024 15:23:39 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-92,A,author_0,,,Mon Apr 15 2024 16:44:59 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-92,B,author_0,,,Sat Dec 21 2024 03:29:38 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-92,A,expert_26,,,Mon Apr 15 2024 06:49:58 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-92,A,expert_26,,,Mon Jul 01 2024 14:47:25 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-92,A,author_0,,,Mon Aug 05 2024 02:32:37 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-92,A,author_0,,,Mon Jul 01 2024 03:09:16 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-92,A,author_6,,,Fri Dec 27 2024 14:42:50 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-92,Tie,author_6,,,Mon Mar 11 2024 11:03:23 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-92,A,expert_44,,,Sat Apr 20 2024 20:45:35 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-92,B,expert_44,,,Mon Nov 04 2024 00:49:51 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-92,B,author_4,,,Sat Oct 05 2024 15:35:16 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-92,B,author_4,,,Wed Aug 28 2024 00:45:09 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-92,B,expert_14,,,Sat Mar 02 2024 10:01:56 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-92,B,expert_14,,,Fri May 17 2024 05:20:24 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-92,B,author_4,,,Tue Jan 16 2024 04:27:00 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-92,A,author_4,,,Sun Feb 11 2024 19:44:32 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-92,A,author_0,,,Tue Apr 09 2024 06:32:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-92,A,author_0,,,Sat Oct 05 2024 10:59:18 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-92,A,expert_34,,,Mon Oct 28 2024 14:20:38 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-92,A,expert_34,,,Sat Jul 20 2024 01:50:08 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-92,B,author_0,,,Thu Sep 12 2024 06:43:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-92,B,author_0,,,Tue Aug 13 2024 14:12:37 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-92,A,expert_0,,,Tue Oct 01 2024 19:11:28 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-92,A,expert_0,,,Sat May 11 2024 14:39:23 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-92,A,expert_36,,,Thu Feb 01 2024 00:59:19 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-92,B,expert_36,,,Tue Mar 05 2024 04:56:27 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-92,B,expert_3,,,Tue May 07 2024 18:09:56 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-92,B,expert_3,,,Thu Mar 07 2024 09:36:10 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-92,B,expert_41,,,Wed Jun 19 2024 00:45:13 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-92,B,expert_41,,,Sun Jun 02 2024 05:05:46 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-92,A,expert_24,,,Sat Aug 24 2024 19:58:22 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-92,B,expert_24,,,Tue Sep 24 2024 08:23:56 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-92,B,expert_0,,,Tue Dec 10 2024 11:25:52 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-92,B,expert_0,,,Sun Dec 08 2024 04:49:01 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-92,B,expert_4,,,Tue Jan 23 2024 19:16:46 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-92,B,expert_4,,,Fri Jan 05 2024 23:51:18 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-92,B,expert_55,,,Sat Oct 05 2024 23:30:25 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-92,Tie,expert_55,,,Thu May 02 2024 20:11:42 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-92,A,expert_40,,,Sun Sep 15 2024 06:39:37 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-92,Tie,expert_40,,,Sat Mar 16 2024 00:36:03 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-92,A,expert_8,,,Mon Jan 08 2024 10:32:52 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-92,B,expert_8,,,Mon Oct 28 2024 07:40:53 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-92,A,expert_38,,,Sat Jun 22 2024 07:08:59 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-92,B,expert_38,,,Wed Nov 13 2024 12:32:32 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-92,B,expert_55,,,Fri Jan 19 2024 08:44:30 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-92,B,expert_55,,,Mon Mar 18 2024 07:32:50 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-92,Tie,expert_24,,,Fri Jan 19 2024 07:32:32 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-92,A,expert_24,,,Sun Dec 15 2024 07:27:31 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-93,B,expert_0,,,Wed Oct 23 2024 21:25:35 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-93,B,expert_0,,,Sat Feb 10 2024 08:23:30 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-93,B,expert_16,,,Wed Aug 14 2024 09:39:18 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-93,B,expert_16,,,Mon Mar 25 2024 17:49:21 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-93,A,author_5,,,Mon Oct 14 2024 04:55:00 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-93,A,author_5,,,Thu Mar 07 2024 12:53:23 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-93,B,expert_33,,,Fri Dec 06 2024 19:32:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-93,A,expert_33,,,Fri Jun 21 2024 13:58:33 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-93,B,author_0,,,Thu Oct 03 2024 17:14:18 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-93,B,author_0,,,Mon Jan 22 2024 20:39:55 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-93,A,author_6,,,Sat Jun 01 2024 04:43:34 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-93,B,author_6,,,Mon Jan 15 2024 03:11:51 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-93,B,expert_9,,,Fri Mar 08 2024 03:43:02 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-93,A,expert_9,,,Wed Jan 10 2024 17:19:25 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-93,B,author_4,,,Sun Mar 10 2024 14:21:12 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-93,Tie,author_4,,,Sat Apr 06 2024 20:18:04 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-93,A,expert_13,,,Sat May 04 2024 23:48:04 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-93,A,expert_13,,,Mon Aug 19 2024 00:59:43 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-93,A,expert_24,,,Fri Jul 05 2024 13:26:35 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-93,A,expert_24,,,Sat Mar 02 2024 18:05:57 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-93,A,expert_32,,,Sun Feb 11 2024 07:07:05 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-93,A,expert_32,,,Thu Jan 25 2024 03:37:48 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-93,Tie,expert_24,,,Fri Oct 11 2024 09:33:04 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-93,A,expert_24,,,Fri Apr 12 2024 21:57:43 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-93,A,expert_44,,,Sun Oct 20 2024 13:32:08 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-93,B,expert_44,,,Sat Aug 24 2024 19:16:47 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-93,B,author_2,,,Wed Sep 04 2024 22:45:37 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-93,B,author_2,,,Sat Dec 14 2024 09:26:12 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-93,B,expert_38,,,Sun Nov 24 2024 11:25:44 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-93,B,expert_38,,,Thu Sep 19 2024 07:08:06 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-93,B,author_2,,,Thu Dec 05 2024 19:14:30 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-93,B,author_2,,,Thu Feb 01 2024 13:02:33 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-93,B,expert_0,,,Fri Jun 21 2024 10:10:31 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-93,B,expert_0,,,Thu Sep 26 2024 06:11:40 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-93,B,expert_29,,,Sat Jul 13 2024 23:02:55 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-93,B,expert_29,,,Thu Sep 12 2024 02:17:16 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-93,A,expert_8,,,Fri Aug 02 2024 23:49:18 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-93,A,expert_8,,,Thu Jun 13 2024 07:27:50 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-94,B,expert_10,,,Mon Sep 23 2024 22:33:03 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-94,B,expert_10,,,Tue Sep 24 2024 14:20:07 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-94,B,expert_31,,,Sun Dec 15 2024 02:34:20 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-94,B,expert_31,,,Sat Oct 19 2024 12:52:18 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-94,A,expert_2,,,Sun May 05 2024 12:36:21 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-94,A,expert_2,,,Mon Oct 28 2024 22:37:46 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-94,A,expert_12,,,Tue May 28 2024 19:52:07 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-94,A,expert_12,,,Fri Aug 23 2024 07:03:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-94,A,expert_1,,,Mon Jun 17 2024 18:54:51 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-94,B,expert_1,,,Mon Jun 10 2024 16:41:39 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-94,Tie,author_0,,,Fri Jun 21 2024 16:16:59 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-94,B,author_0,,,Thu Nov 28 2024 06:41:55 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-94,B,expert_27,,,Fri Dec 13 2024 02:40:28 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-94,B,expert_27,,,Mon Jan 15 2024 02:35:18 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-94,A,expert_39,,,Sun Sep 01 2024 13:55:45 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-94,A,expert_39,,,Thu Apr 11 2024 04:07:58 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-94,A,author_4,,,Wed Jul 24 2024 22:01:09 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-94,Tie,author_4,,,Sat May 11 2024 05:41:04 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-94,B,expert_50,,,Sun Sep 08 2024 10:59:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-94,B,expert_50,,,Wed Dec 18 2024 14:34:33 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-94,A,author_2,,,Thu Jun 20 2024 18:15:19 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-94,A,author_2,,,Sun Mar 17 2024 16:47:08 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-94,B,expert_6,,,Sat Jan 06 2024 14:50:50 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-94,B,expert_6,,,Fri Oct 25 2024 17:27:20 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-94,B,expert_12,,,Wed Jul 03 2024 09:12:42 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-94,A,expert_12,,,Fri Dec 20 2024 04:44:26 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-94,Tie,expert_47,,,Sat Sep 14 2024 02:42:35 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-94,A,expert_47,,,Fri Oct 18 2024 02:45:41 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-94,A,expert_5,,,Fri Nov 22 2024 01:24:27 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-94,B,expert_5,,,Mon Dec 23 2024 22:09:19 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-94,A,expert_6,,,Thu Aug 01 2024 22:12:13 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-94,A,expert_6,,,Tue Jun 25 2024 09:32:42 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-95,Tie,author_3,,,Tue Nov 26 2024 17:09:11 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-95,B,author_3,,,Tue Apr 09 2024 23:37:01 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-95,A,expert_16,,,Tue Jun 04 2024 17:24:45 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-95,Tie,expert_16,,,Sun Apr 21 2024 05:43:27 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-95,A,expert_28,,,Sun May 26 2024 08:02:44 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-95,B,expert_28,,,Wed Apr 24 2024 18:38:19 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-95,B,expert_38,,,Mon Mar 04 2024 17:20:37 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-95,Tie,expert_38,,,Tue Mar 12 2024 09:27:12 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-95,B,author_4,,,Sat May 11 2024 02:01:03 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-95,A,author_4,,,Tue Jan 02 2024 17:02:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-95,B,expert_24,,,Wed Oct 09 2024 10:37:27 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-95,A,expert_24,,,Fri Mar 22 2024 04:17:09 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-95,A,author_0,,,Mon Oct 07 2024 13:19:42 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-95,A,expert_6,,,Wed Dec 18 2024 18:16:25 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-95,A,expert_6,,,Sat Mar 09 2024 07:46:56 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-95,B,expert_29,,,Tue May 28 2024 17:02:55 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-95,B,expert_29,,,Sat Jan 06 2024 22:38:53 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-95,A,expert_53,,,Wed Dec 25 2024 21:27:13 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-95,A,expert_53,,,Thu Jan 18 2024 14:54:47 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-95,B,expert_57,,,Sun Apr 21 2024 17:04:44 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-95,B,expert_57,,,Sat May 25 2024 04:48:03 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-95,A,expert_11,,,Tue Nov 26 2024 00:51:32 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-95,A,expert_11,,,Thu Nov 07 2024 03:34:08 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-95,A,expert_55,,,Tue Feb 20 2024 07:49:09 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-95,A,expert_55,,,Tue Nov 05 2024 04:03:17 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-95,A,author_3,,,Sat Feb 10 2024 16:29:29 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-95,Tie,author_3,,,Fri Apr 26 2024 18:10:29 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-95,B,expert_10,,,Sat Jul 27 2024 15:59:42 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-95,B,expert_10,,,Tue Aug 13 2024 03:48:04 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-95,B,expert_24,,,Fri Aug 16 2024 13:31:15 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-95,B,expert_24,,,Mon Mar 11 2024 05:21:26 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-95,B,expert_39,,,Thu May 02 2024 01:13:57 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-95,B,expert_39,,,Thu Apr 11 2024 01:16:37 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-95,A,expert_49,,,Sat Mar 02 2024 02:55:58 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-95,Tie,expert_49,,,Fri Feb 23 2024 18:46:07 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-95,Tie,expert_9,,,Sun Mar 03 2024 01:39:08 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-95,Tie,expert_9,,,Fri Jul 12 2024 13:18:35 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-95,B,author_0,,,Tue Mar 26 2024 06:12:31 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-95,B,author_0,,,Sun Sep 08 2024 09:29:42 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-95,B,expert_19,,,Thu Jan 18 2024 18:18:07 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-95,B,expert_19,,,Mon Apr 01 2024 18:20:09 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-96,B,author_2,,,Fri Jun 07 2024 13:23:34 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-96,B,author_2,,,Sun Nov 24 2024 18:25:05 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-96,B,expert_51,,,Thu Nov 21 2024 12:58:56 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-96,B,expert_51,,,Sat Nov 02 2024 23:24:22 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-96,A,author_0,,,Tue Dec 17 2024 04:42:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-96,Tie,author_0,,,Fri Sep 06 2024 08:33:50 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-96,A,expert_15,,,Tue Aug 06 2024 10:32:43 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-96,A,expert_15,,,Wed Nov 20 2024 05:22:04 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-96,A,expert_24,,,Wed Jan 24 2024 08:06:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-96,A,expert_24,,,Sun Mar 17 2024 04:54:02 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-96,A,author_0,,,Fri Jan 12 2024 14:44:13 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-96,A,author_0,,,Tue Nov 12 2024 19:48:50 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-96,A,author_6,,,Sun Nov 10 2024 15:17:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-96,A,author_6,,,Mon Jul 01 2024 14:31:16 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-96,A,expert_43,,,Sat May 04 2024 18:41:58 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-96,A,expert_43,,,Sat Dec 07 2024 00:18:52 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-96,B,expert_44,,,Mon May 20 2024 23:03:36 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-96,A,expert_44,,,Fri Nov 01 2024 20:55:22 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-96,A,expert_50,,,Thu Jan 18 2024 18:01:18 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-96,B,expert_50,,,Wed Jul 10 2024 16:22:51 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-96,A,expert_51,,,Thu Jun 06 2024 00:49:53 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-96,A,expert_51,,,Sat Jan 20 2024 19:05:54 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-96,A,expert_27,,,Thu Jan 25 2024 02:52:23 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-96,B,expert_27,,,Fri Apr 05 2024 21:36:32 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-96,B,expert_16,,,Mon Jul 01 2024 03:13:51 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-96,B,expert_16,,,Wed May 15 2024 17:58:05 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-96,A,expert_37,,,Sun May 26 2024 22:03:10 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-96,B,expert_37,,,Thu May 09 2024 22:35:19 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-96,Tie,expert_25,,,Sat Dec 14 2024 06:31:56 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-96,Tie,expert_24,,,Fri Mar 22 2024 09:51:10 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-96,B,expert_24,,,Mon Dec 02 2024 22:02:20 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-97,B,expert_30,,,Tue Aug 20 2024 00:38:49 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-97,B,expert_30,,,Sat Jun 22 2024 06:18:14 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-97,B,expert_23,,,Tue Jul 09 2024 08:35:41 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-97,A,expert_23,,,Thu Apr 11 2024 17:49:49 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-97,A,expert_42,,,Mon Mar 18 2024 21:27:00 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-97,B,expert_42,,,Tue Apr 23 2024 06:56:02 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-97,A,expert_43,,,Thu Jun 27 2024 14:48:51 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-97,A,expert_43,,,Mon Aug 12 2024 10:53:50 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-97,A,expert_28,,,Thu Jun 27 2024 02:31:37 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-97,A,expert_28,,,Thu Dec 12 2024 12:44:00 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-97,A,expert_13,,,Thu Sep 05 2024 13:07:19 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-97,B,expert_13,,,Wed Oct 02 2024 04:13:35 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-97,B,expert_9,,,Wed Aug 28 2024 16:00:41 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-97,A,expert_9,,,Mon Mar 18 2024 02:03:23 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-97,A,expert_57,,,Mon Jan 01 2024 07:59:58 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-97,A,expert_57,,,Wed Feb 07 2024 22:43:05 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-97,B,expert_24,,,Sun Nov 17 2024 10:31:20 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-97,B,expert_24,,,Mon Nov 18 2024 20:23:52 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-97,B,expert_38,,,Tue Aug 06 2024 12:23:01 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-97,B,expert_38,,,Mon Jan 15 2024 15:37:50 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-97,A,expert_24,,,Thu Mar 14 2024 10:15:27 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-97,A,expert_24,,,Wed Jul 24 2024 18:31:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-97,Tie,author_0,,,Sat Oct 05 2024 03:45:52 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-97,Tie,author_0,,,Wed May 01 2024 06:17:57 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-97,Tie,expert_0,,,Sun Jul 14 2024 12:23:15 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-97,Tie,expert_0,,,Wed Jan 03 2024 02:00:37 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-97,Tie,expert_31,,,Thu Nov 07 2024 04:49:27 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-97,Tie,expert_31,,,Wed Jul 17 2024 00:42:04 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-97,B,expert_46,,,Wed Nov 20 2024 00:52:28 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-97,A,expert_46,,,Tue May 07 2024 01:19:21 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-97,A,expert_57,,,Mon Dec 02 2024 21:35:58 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-97,A,expert_57,,,Thu May 16 2024 20:08:38 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-97,A,author_0,,,Sat Nov 02 2024 08:01:31 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-97,A,author_0,,,Wed Jun 26 2024 11:19:53 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-97,A,expert_27,,,Wed Jun 26 2024 13:11:39 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-97,A,expert_27,,,Tue Aug 06 2024 09:06:53 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-97,A,expert_15,,,Tue Apr 02 2024 17:53:41 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-97,A,expert_15,,,Sat May 04 2024 01:39:41 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-97,A,expert_50,,,Fri Jun 21 2024 04:04:35 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-97,Tie,expert_50,,,Mon Dec 23 2024 17:28:43 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-97,B,expert_40,,,Thu Oct 24 2024 15:22:33 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-97,B,expert_40,,,Sun Aug 11 2024 04:26:45 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-97,B,expert_23,,,Thu Sep 05 2024 01:44:30 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-97,A,expert_23,,,Tue May 07 2024 18:02:24 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-97,B,expert_15,,,Sat Jun 22 2024 19:18:49 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-97,A,expert_15,,,Tue Jan 23 2024 21:18:51 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-97,A,expert_51,,,Mon Mar 18 2024 19:04:03 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-97,B,expert_51,,,Wed Mar 06 2024 16:39:46 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-97,A,expert_14,,,Sun Apr 07 2024 11:42:10 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-97,B,expert_14,,,Thu Jan 18 2024 09:05:58 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-97,A,author_6,,,Tue Oct 08 2024 04:03:48 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-97,A,author_6,,,Wed Apr 24 2024 22:45:12 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-97,A,expert_53,,,Thu Jan 18 2024 19:12:34 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-97,A,expert_53,,,Sun Aug 04 2024 11:41:49 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-98,A,expert_1,,,Sun Nov 10 2024 23:15:06 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-98,A,expert_1,,,Sun May 26 2024 22:51:01 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-98,A,expert_21,,,Fri Feb 09 2024 06:20:06 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-98,A,expert_21,,,Sat May 04 2024 20:34:31 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-98,B,expert_16,,,Thu Dec 05 2024 15:34:55 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-98,B,expert_16,,,Wed Jul 17 2024 15:17:57 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-98,A,expert_13,,,Sat Feb 17 2024 13:34:27 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-98,A,expert_13,,,Thu Mar 28 2024 12:08:01 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-98,A,expert_44,,,Mon Oct 21 2024 10:08:24 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-98,A,expert_44,,,Sun Dec 15 2024 04:29:16 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-98,B,expert_0,,,Tue Apr 02 2024 22:00:04 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-98,A,expert_0,,,Mon Dec 23 2024 19:52:07 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-98,A,expert_21,,,Sat Feb 17 2024 09:06:23 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-98,A,expert_21,,,Fri Oct 25 2024 19:33:33 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-98,A,expert_55,,,Sun Apr 28 2024 17:42:34 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-98,A,expert_55,,,Fri Sep 06 2024 10:40:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-98,A,expert_47,,,Tue Dec 10 2024 20:56:43 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-98,A,expert_47,,,Mon Oct 14 2024 17:06:36 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-98,B,author_4,,,Fri May 17 2024 21:03:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-98,A,author_4,,,Sun Dec 22 2024 13:34:01 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-98,B,expert_9,,,Sun Oct 20 2024 01:34:35 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-98,B,expert_9,,,Sun May 12 2024 13:15:10 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-98,Tie,expert_2,,,Mon Feb 12 2024 04:15:13 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-98,Tie,expert_2,,,Fri Aug 16 2024 11:21:01 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-98,A,expert_54,,,Mon Dec 16 2024 22:16:02 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-98,A,expert_54,,,Thu May 16 2024 17:20:08 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-98,B,expert_16,,,Wed Sep 04 2024 18:05:26 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-98,B,expert_16,,,Fri Jan 26 2024 11:23:36 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-98,B,author_0,,,Thu Feb 08 2024 18:46:16 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-98,B,expert_47,,,Thu Sep 05 2024 13:50:45 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-98,B,expert_47,,,Mon Dec 09 2024 22:23:29 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-98,A,expert_2,,,Tue Apr 23 2024 18:37:48 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-98,A,expert_2,,,Tue Apr 09 2024 20:59:22 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-98,A,expert_41,,,Mon Jul 22 2024 04:39:56 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-98,A,expert_41,,,Wed Dec 04 2024 06:16:35 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-98,A,author_2,,,Sun Jul 14 2024 01:22:08 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-98,B,author_2,,,Tue Mar 12 2024 01:11:07 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-98,A,expert_1,,,Tue Jul 09 2024 00:19:49 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-98,B,expert_1,,,Fri Mar 08 2024 18:34:54 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-98,Tie,expert_22,,,Sat May 18 2024 02:14:28 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-98,A,expert_22,,,Sun Dec 08 2024 00:29:40 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-98,B,expert_44,,,Sat May 04 2024 06:56:54 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-98,B,expert_44,,,Mon Jul 08 2024 06:13:46 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-98,Tie,author_3,,,Mon Mar 04 2024 20:29:51 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-98,A,author_3,,,Sat Apr 06 2024 13:42:26 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-99,B,expert_17,,,Tue Jan 23 2024 15:02:02 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-99,B,expert_17,,,Wed Sep 04 2024 08:48:41 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-99,B,expert_19,,,Tue Oct 15 2024 21:34:05 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-99,B,expert_19,,,Tue Jan 23 2024 18:01:46 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-99,B,author_3,,,Mon Jan 01 2024 22:50:14 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-99,A,author_3,,,Fri Jul 19 2024 03:36:49 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-99,B,expert_24,,,Sun Nov 03 2024 19:25:23 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-99,Tie,expert_24,,,Sat Jun 22 2024 02:22:50 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-99,A,expert_36,,,Mon Nov 18 2024 13:31:31 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-99,B,expert_36,,,Wed Oct 09 2024 06:17:12 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-99,B,expert_46,,,Sun Nov 10 2024 17:10:46 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-99,A,expert_46,,,Mon Jul 22 2024 11:03:13 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-99,A,expert_5,,,Fri Jan 12 2024 08:47:38 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-99,B,expert_5,,,Tue Jan 23 2024 10:05:45 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-99,A,expert_42,,,Sun Oct 20 2024 17:06:21 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-99,A,expert_42,,,Sat Aug 10 2024 04:30:09 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-99,A,expert_4,,,Tue Jul 23 2024 04:25:47 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-99,A,expert_4,,,Tue Dec 17 2024 18:02:50 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-99,A,author_2,,,Fri Dec 13 2024 05:34:18 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-99,A,author_2,,,Sat Sep 28 2024 12:53:28 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-99,A,author_0,,,Thu Oct 03 2024 08:24:52 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-99,Tie,author_0,,,Thu Nov 07 2024 03:08:45 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-99,A,expert_24,,,Tue Feb 06 2024 20:45:03 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-99,Tie,expert_24,,,Sun Jul 14 2024 09:37:48 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-99,A,author_3,,,Thu Jan 25 2024 01:59:14 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-99,A,author_3,,,Fri Sep 27 2024 19:23:25 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-99,Tie,expert_11,,,Fri May 03 2024 01:26:02 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-99,A,expert_11,,,Tue Oct 22 2024 02:33:12 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-99,A,expert_51,,,Tue Apr 09 2024 08:11:19 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-99,A,expert_51,,,Sun Jun 02 2024 19:00:32 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-99,A,author_3,,,Fri Aug 16 2024 16:20:36 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-99,A,author_3,,,Fri Jun 14 2024 07:10:29 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-99,B,expert_22,,,Mon Jun 17 2024 03:18:52 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-99,B,expert_22,,,Sat Dec 21 2024 22:23:09 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-99,B,expert_27,,,Sun May 12 2024 01:57:41 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-99,B,expert_27,,,Tue Oct 08 2024 12:14:33 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-99,B,expert_28,,,Sun Jul 14 2024 18:35:36 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-99,B,expert_28,,,Tue Oct 22 2024 02:09:29 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-99,B,author_3,,,Sat Sep 21 2024 23:18:51 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-99,B,author_3,,,Wed Jun 12 2024 11:19:45 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-99,A,expert_21,,,Sat Aug 24 2024 03:49:00 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-99,A,expert_21,,,Wed Apr 24 2024 11:44:59 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-99,B,author_4,,,Sat Jan 20 2024 21:58:29 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-99,B,author_4,,,Sat Feb 17 2024 11:55:48 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-99,B,expert_42,,,Tue Dec 10 2024 11:18:45 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-99,B,expert_42,,,Sat Dec 28 2024 13:04:24 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-99,B,expert_50,,,Mon Jan 01 2024 22:08:41 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-99,B,expert_50,,,Thu Dec 12 2024 05:53:56 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-99,B,expert_42,,,Sat Apr 20 2024 02:55:52 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-99,B,expert_42,,,Mon Jun 17 2024 12:08:52 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-100,A,expert_14,,,Thu Mar 07 2024 02:19:35 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-100,A,expert_14,,,Sat May 18 2024 21:32:25 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-100,A,expert_6,,,Sat May 04 2024 04:45:51 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-100,A,expert_6,,,Sat Feb 03 2024 18:02:31 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-100,B,expert_13,,,Sat Jul 06 2024 15:47:03 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-100,A,expert_13,,,Thu Mar 21 2024 01:39:10 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-100,A,expert_41,,,Wed Jun 12 2024 12:24:12 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-100,Tie,expert_41,,,Sat Jun 22 2024 06:05:06 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-100,A,author_5,,,Wed Dec 25 2024 20:03:11 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-100,A,author_5,,,Sun Sep 08 2024 16:48:50 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-100,Tie,expert_35,,,Fri Aug 02 2024 11:23:25 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-100,A,expert_35,,,Sun Jul 07 2024 06:34:50 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-100,B,author_4,,,Sat Sep 14 2024 17:45:43 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-100,B,author_4,,,Wed Nov 13 2024 12:09:58 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-100,B,expert_0,,,Fri Aug 09 2024 03:23:07 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-100,B,expert_0,,,Fri Jul 19 2024 05:58:14 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-100,B,expert_44,,,Thu Apr 04 2024 00:50:28 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-100,B,expert_44,,,Sat Mar 09 2024 20:59:55 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-100,B,expert_9,,,Wed May 01 2024 21:58:48 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-100,B,expert_9,,,Fri Oct 11 2024 17:59:53 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-100,B,author_4,,,Fri Sep 06 2024 00:12:05 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-100,Tie,author_4,,,Wed Apr 10 2024 10:44:55 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-100,B,expert_24,,,Mon Sep 09 2024 07:56:53 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-100,A,expert_24,,,Wed Nov 06 2024 20:51:57 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-100,A,expert_24,,,Sun Jun 23 2024 07:53:20 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-100,A,expert_24,,,Thu Dec 26 2024 08:24:43 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-100,A,expert_26,,,Fri Jan 05 2024 21:10:26 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-100,A,expert_26,,,Sun May 26 2024 07:41:48 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-100,A,expert_28,,,Mon Jun 03 2024 08:28:42 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-100,A,author_4,,,Sun Sep 22 2024 19:52:09 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-100,A,author_4,,,Fri Jun 28 2024 01:28:26 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-100,B,expert_32,,,Tue Dec 24 2024 22:46:39 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-100,Tie,expert_32,,,Sat May 18 2024 02:21:51 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-100,B,expert_4,,,Wed Jun 05 2024 23:34:41 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-100,B,expert_4,,,Tue Sep 03 2024 07:32:17 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-100,B,expert_2,,,Thu Oct 24 2024 20:58:29 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-100,B,expert_2,,,Mon Apr 22 2024 02:55:13 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-100,B,expert_6,,,Thu Aug 01 2024 05:26:52 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-100,A,expert_6,,,Sun Aug 25 2024 08:07:49 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-100,B,expert_0,,,Tue Jan 16 2024 05:50:08 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-100,A,expert_0,,,Tue Jun 11 2024 05:38:01 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-100,B,expert_57,,,Mon Sep 16 2024 03:38:17 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-100,B,expert_57,,,Sat Aug 24 2024 09:20:41 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-100,B,expert_6,,,Tue Apr 16 2024 04:20:31 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-100,B,expert_6,,,Wed Dec 11 2024 02:20:36 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-100,A,author_2,,,Tue May 07 2024 14:45:46 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-100,A,author_2,,,Tue Dec 10 2024 12:05:04 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-100,A,expert_19,,,Fri Aug 16 2024 09:36:00 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-100,A,expert_19,,,Tue Feb 13 2024 06:53:11 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-100,Tie,author_4,,,Sun Mar 03 2024 11:28:43 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-100,Tie,author_4,,,Tue Apr 09 2024 07:59:41 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-100,Tie,author_6,,,Mon Apr 01 2024 11:23:35 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-100,Tie,author_6,,,Thu May 16 2024 09:26:38 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-100,B,expert_24,,,Fri Jun 14 2024 19:12:57 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-100,B,expert_24,,,Tue Mar 26 2024 22:24:31 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-100,A,expert_9,,,Sun Jun 09 2024 20:13:04 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-100,A,expert_9,,,Tue Mar 05 2024 01:02:05 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-101,B,author_4,,,Fri Feb 23 2024 19:00:10 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-101,Tie,author_4,,,Sat Jul 06 2024 06:27:32 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-101,A,expert_23,,,Thu Jul 25 2024 07:07:32 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-101,Tie,expert_23,,,Fri Dec 06 2024 19:08:22 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-101,Tie,author_4,,,Thu Nov 28 2024 05:40:06 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-101,B,author_4,,,Mon Apr 22 2024 23:00:08 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-101,Tie,expert_16,,,Mon Aug 26 2024 03:39:49 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-101,B,expert_16,,,Sat Apr 13 2024 23:16:34 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-101,B,expert_14,,,Sun Sep 22 2024 06:39:12 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-101,A,expert_14,,,Fri Jun 07 2024 21:12:08 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-101,A,expert_38,,,Fri Jul 12 2024 17:40:27 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-101,Tie,expert_38,,,Sun Oct 06 2024 22:42:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-101,Tie,expert_40,,,Thu May 23 2024 19:32:51 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-101,B,expert_40,,,Sat Jan 13 2024 20:28:36 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-101,B,expert_6,,,Mon Jun 24 2024 04:58:20 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-101,B,expert_6,,,Tue Aug 13 2024 05:02:53 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-101,A,author_3,,,Mon Aug 26 2024 05:56:55 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-101,A,author_3,,,Sun Sep 08 2024 23:51:50 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-101,Tie,author_2,,,Sat Aug 10 2024 20:00:48 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-101,A,author_2,,,Fri Apr 12 2024 05:12:51 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-101,Tie,expert_9,,,Thu Jul 18 2024 01:26:49 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-101,A,expert_9,,,Tue Feb 27 2024 18:16:10 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-101,A,expert_36,,,Sat Feb 24 2024 21:25:46 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-101,A,expert_36,,,Sat Jan 27 2024 07:18:06 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-101,A,expert_43,,,Mon May 06 2024 12:36:37 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-101,A,expert_43,,,Thu Jan 11 2024 07:11:30 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-101,B,expert_22,,,Thu May 23 2024 02:56:36 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-101,Tie,expert_22,,,Fri May 03 2024 12:38:40 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-101,B,expert_24,,,Mon Nov 04 2024 12:16:45 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-101,B,expert_24,,,Fri Jul 26 2024 14:59:59 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-101,B,expert_4,,,Sat Jun 22 2024 22:34:39 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-101,B,expert_4,,,Sat May 25 2024 13:57:52 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-101,A,expert_31,,,Wed Apr 03 2024 18:32:53 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-101,Tie,expert_31,,,Thu Mar 14 2024 22:02:12 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-101,Tie,expert_24,,,Sun Oct 27 2024 23:08:35 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-101,B,expert_24,,,Tue Jan 09 2024 21:44:17 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-101,Tie,expert_45,,,Sun Dec 15 2024 13:08:45 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-101,Tie,expert_45,,,Sat Jun 08 2024 09:12:57 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-101,Tie,expert_6,,,Sun Dec 08 2024 03:32:02 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-101,Tie,expert_6,,,Sun Aug 11 2024 02:43:36 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-102,B,expert_26,,,Fri Oct 04 2024 15:32:25 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-102,Tie,expert_26,,,Fri Sep 06 2024 20:20:27 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-102,B,expert_46,,,Sat Aug 17 2024 20:41:27 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-102,Tie,expert_46,,,Thu Mar 07 2024 13:29:52 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-102,B,expert_9,,,Tue May 28 2024 11:03:25 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-102,Tie,expert_9,,,Thu Jul 11 2024 12:26:07 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-102,B,expert_37,,,Sat Mar 16 2024 00:15:19 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-102,B,expert_37,,,Fri Jan 26 2024 20:15:31 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-102,A,expert_37,,,Mon Dec 16 2024 03:28:51 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-102,Tie,expert_37,,,Mon Apr 22 2024 10:06:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-102,A,author_4,,,Sat Jun 22 2024 07:49:06 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-102,Tie,author_4,,,Wed Jun 12 2024 00:24:14 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-102,A,expert_53,,,Fri Feb 16 2024 14:59:17 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-102,Tie,expert_53,,,Thu Oct 17 2024 02:42:28 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-102,B,expert_33,,,Tue Mar 12 2024 01:37:28 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-102,A,expert_33,,,Tue Jul 02 2024 03:10:41 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-102,A,expert_45,,,Thu Oct 17 2024 23:27:44 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-102,Tie,expert_45,,,Sun Dec 01 2024 09:00:25 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-102,Tie,expert_9,,,Fri May 17 2024 10:47:12 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-102,A,expert_9,,,Mon Mar 18 2024 09:13:50 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-102,Tie,expert_0,,,Thu Dec 26 2024 12:29:32 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-102,B,expert_0,,,Mon Oct 14 2024 10:24:39 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-102,Tie,expert_5,,,Wed Oct 09 2024 09:10:27 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-102,Tie,expert_5,,,Sat Jun 01 2024 18:43:07 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-102,A,expert_56,,,Tue May 28 2024 11:35:55 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-102,B,expert_56,,,Thu Feb 22 2024 05:13:08 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-102,Tie,expert_44,,,Sun Nov 03 2024 15:24:52 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-102,A,expert_44,,,Thu Jan 04 2024 15:00:54 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-102,Tie,expert_5,,,Mon Mar 11 2024 07:38:29 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-102,Tie,expert_5,,,Sun Jul 21 2024 04:40:34 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-102,B,expert_57,,,Tue Sep 03 2024 16:53:57 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-102,A,expert_57,,,Tue Jul 09 2024 15:23:44 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-103,B,expert_56,,,Sun May 05 2024 17:44:34 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-103,B,expert_56,,,Sun Jun 16 2024 11:58:08 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-103,B,expert_35,,,Fri Aug 16 2024 04:41:56 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-103,B,expert_35,,,Fri Jul 05 2024 21:58:18 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-103,A,expert_14,,,Fri Mar 01 2024 11:15:45 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-103,A,expert_14,,,Mon Jul 15 2024 09:50:38 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-103,A,expert_4,,,Wed Dec 25 2024 09:52:54 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-103,A,expert_4,,,Sat Aug 10 2024 00:50:03 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-103,A,author_3,,,Wed Sep 18 2024 18:04:59 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-103,A,author_3,,,Mon Oct 28 2024 04:58:26 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-103,A,expert_48,,,Mon Aug 05 2024 01:34:06 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-103,B,expert_48,,,Thu Mar 21 2024 05:43:51 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-103,A,expert_55,,,Sat Jan 06 2024 07:47:08 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-103,A,expert_55,,,Sun Jan 21 2024 02:09:45 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-103,B,author_4,,,Wed May 01 2024 13:43:02 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-103,B,author_4,,,Wed Sep 18 2024 07:25:34 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-103,B,author_4,,,Mon Jun 03 2024 08:26:28 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-103,B,author_4,,,Thu Oct 10 2024 06:50:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-103,B,expert_24,,,Mon Apr 01 2024 17:49:59 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-103,B,expert_24,,,Wed May 22 2024 07:41:08 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-103,B,expert_35,,,Sun Dec 15 2024 12:07:59 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-103,Tie,expert_35,,,Wed Apr 17 2024 11:59:09 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-103,A,expert_41,,,Sun Feb 18 2024 01:36:14 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-103,A,expert_41,,,Sat Nov 02 2024 08:51:45 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-103,Tie,expert_24,,,Tue Mar 12 2024 13:30:39 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-103,A,expert_24,,,Thu Oct 24 2024 14:25:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-103,Tie,expert_53,,,Thu Dec 05 2024 14:52:43 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-103,A,expert_53,,,Tue Sep 10 2024 02:41:17 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-103,A,expert_10,,,Wed Dec 25 2024 02:39:44 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-103,A,expert_10,,,Thu May 09 2024 15:25:55 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-103,A,expert_9,,,Tue Jan 23 2024 15:03:55 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-103,A,expert_9,,,Thu Mar 21 2024 20:40:35 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-103,A,expert_40,,,Thu Oct 24 2024 03:43:22 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-103,A,expert_40,,,Wed Oct 02 2024 14:25:01 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-103,B,expert_11,,,Sat Aug 10 2024 15:32:05 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-103,B,expert_11,,,Fri Sep 13 2024 01:59:54 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-103,B,expert_29,,,Sat Nov 09 2024 05:36:04 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-103,B,expert_29,,,Thu Jul 04 2024 09:53:38 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-103,B,author_3,,,Sun May 05 2024 03:55:29 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-103,B,author_3,,,Mon Jul 08 2024 00:04:55 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-103,B,expert_34,,,Sat Nov 09 2024 10:33:11 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-103,B,expert_34,,,Thu Mar 21 2024 11:23:58 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-103,B,author_2,,,Mon Oct 28 2024 03:44:01 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-103,B,author_2,,,Sun Feb 04 2024 01:05:13 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-103,Tie,expert_55,,,Wed Mar 06 2024 22:31:48 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-103,A,expert_55,,,Sun Jun 09 2024 06:42:05 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-103,B,expert_8,,,Fri Jun 07 2024 05:16:32 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-103,B,expert_8,,,Sat Dec 21 2024 09:26:02 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-103,Tie,author_4,,,Tue May 14 2024 10:39:30 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-103,B,author_4,,,Mon Apr 22 2024 19:11:04 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-103,B,expert_19,,,Sat Nov 16 2024 00:14:24 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-103,B,expert_19,,,Sat Dec 14 2024 10:39:59 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-103,A,expert_0,,,Wed Mar 13 2024 01:58:47 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-103,A,expert_0,,,Tue Jun 11 2024 08:32:10 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-104,Tie,author_4,,,Sat May 11 2024 03:40:22 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-104,B,author_4,,,Fri Jun 21 2024 22:49:58 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-104,Tie,expert_0,,,Sun Apr 28 2024 04:44:33 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-104,B,expert_0,,,Sun Oct 13 2024 04:23:41 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-104,Tie,expert_17,,,Wed Feb 07 2024 13:20:55 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-104,B,expert_17,,,Wed Jul 10 2024 14:25:38 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-104,Tie,expert_43,,,Fri Sep 27 2024 10:06:40 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-104,B,expert_43,,,Fri Jun 28 2024 21:56:42 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-104,Tie,expert_41,,,Sat Dec 21 2024 05:26:32 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-104,Tie,expert_41,,,Thu Nov 21 2024 12:53:26 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-104,Tie,expert_31,,,Sun Dec 01 2024 07:10:08 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-104,Tie,expert_31,,,Fri Mar 22 2024 14:09:51 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-104,Tie,expert_9,,,Thu Aug 08 2024 14:09:08 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-104,Tie,expert_9,,,Tue Jun 18 2024 01:33:01 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-104,A,expert_12,,,Sat Apr 06 2024 07:50:08 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-104,Tie,expert_12,,,Thu Jun 20 2024 01:01:06 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-104,A,expert_41,,,Tue Jun 18 2024 00:31:13 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-104,Tie,expert_41,,,Mon Oct 21 2024 02:29:53 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-104,Tie,expert_24,,,Fri Jul 26 2024 16:08:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-104,A,expert_24,,,Wed May 08 2024 21:30:44 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-104,B,expert_50,,,Wed Jan 10 2024 18:45:22 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-104,A,expert_50,,,Fri Sep 27 2024 13:40:54 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-104,Tie,author_0,,,Thu Jun 20 2024 19:23:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-104,A,author_0,,,Tue Apr 16 2024 14:39:52 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-104,A,author_4,,,Sat Nov 02 2024 10:28:01 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-104,A,author_4,,,Sun Feb 04 2024 20:45:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-104,Tie,expert_0,,,Mon Aug 19 2024 14:11:54 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-104,A,expert_0,,,Wed Apr 10 2024 04:51:02 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-104,Tie,expert_10,,,Sat Jun 08 2024 23:53:54 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-104,Tie,expert_10,,,Sun Mar 10 2024 05:27:25 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-104,Tie,expert_27,,,Sat Feb 17 2024 21:40:59 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-104,Tie,expert_27,,,Wed Jan 24 2024 11:00:46 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-104,Tie,expert_40,,,Thu Nov 14 2024 02:18:17 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-104,Tie,expert_40,,,Thu Apr 18 2024 03:18:39 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-104,Tie,author_4,,,Wed Feb 21 2024 06:14:40 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-104,B,author_4,,,Tue Sep 03 2024 18:38:43 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-104,Tie,expert_5,,,Fri Jun 07 2024 13:40:16 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-104,Tie,expert_5,,,Wed Apr 17 2024 14:57:37 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-104,B,expert_1,,,Mon Oct 07 2024 07:05:46 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-104,Tie,expert_1,,,Tue Apr 16 2024 17:56:31 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-104,B,expert_45,,,Sat May 18 2024 06:09:14 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-104,B,expert_45,,,Sat Nov 23 2024 08:28:30 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-104,Tie,expert_16,,,Sat Jun 22 2024 08:04:05 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-104,Tie,expert_16,,,Sun Apr 21 2024 02:13:12 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-104,B,expert_25,,,Thu Feb 15 2024 14:25:37 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-104,Tie,expert_25,,,Thu Feb 01 2024 03:08:21 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-104,Tie,expert_38,,,Sat Sep 07 2024 08:45:18 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-104,Tie,expert_38,,,Fri Jul 05 2024 06:39:09 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-105,Tie,expert_3,,,Sat Oct 05 2024 12:11:49 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-105,Tie,expert_3,,,Mon Dec 09 2024 00:05:57 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-105,Tie,expert_26,,,Tue Nov 19 2024 08:13:58 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-105,Tie,expert_26,,,Fri Oct 18 2024 18:20:08 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-105,Tie,expert_21,,,Fri Jul 12 2024 15:05:14 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-105,Tie,expert_21,,,Tue Apr 09 2024 07:42:39 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-105,Tie,expert_9,,,Fri Jul 26 2024 11:08:28 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-105,Tie,expert_9,,,Sat Oct 19 2024 23:17:27 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-105,Tie,expert_27,,,Thu Feb 08 2024 08:35:44 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-105,Tie,expert_27,,,Thu Jun 06 2024 18:15:50 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-105,Tie,expert_35,,,Fri Sep 06 2024 02:28:21 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-105,Tie,expert_35,,,Wed Jun 19 2024 23:06:39 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-105,Tie,author_0,,,Wed Sep 25 2024 00:39:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-105,Tie,author_0,,,Tue Dec 03 2024 10:41:42 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-105,Tie,author_3,,,Mon Feb 12 2024 15:25:16 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-105,Tie,author_3,,,Fri Feb 02 2024 05:29:53 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-105,Tie,author_4,,,Sun Apr 28 2024 18:58:33 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-105,Tie,author_4,,,Sun Mar 10 2024 20:56:56 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-105,B,expert_24,,,Tue Sep 03 2024 10:57:00 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-105,B,expert_24,,,Thu Aug 22 2024 06:30:34 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-105,Tie,expert_45,,,Fri Jul 19 2024 12:38:16 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-105,Tie,expert_45,,,Mon Aug 12 2024 01:59:47 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-105,Tie,author_4,,,Thu Jan 04 2024 04:46:21 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-105,Tie,author_4,,,Tue Jul 02 2024 05:04:51 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-105,Tie,author_4,,,Thu Dec 12 2024 10:14:38 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-105,Tie,author_4,,,Sat Jul 27 2024 07:00:08 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-105,Tie,expert_13,,,Wed Dec 11 2024 06:17:43 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-105,Tie,expert_13,,,Tue Oct 08 2024 11:33:18 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-105,Tie,author_3,,,Mon Apr 22 2024 14:11:24 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-105,Tie,author_3,,,Mon May 27 2024 17:12:42 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-105,Tie,expert_25,,,Tue Sep 10 2024 01:35:31 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-105,Tie,expert_25,,,Sun Dec 01 2024 09:22:24 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-105,Tie,expert_2,,,Thu May 02 2024 08:20:47 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-105,Tie,expert_2,,,Wed Sep 11 2024 22:00:02 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-105,Tie,expert_16,,,Wed Sep 11 2024 11:40:44 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-105,B,expert_16,,,Fri May 24 2024 15:10:12 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-105,Tie,expert_44,,,Thu Apr 18 2024 23:27:01 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-105,Tie,expert_44,,,Sat Oct 26 2024 01:42:14 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-105,Tie,expert_40,,,Fri Jun 14 2024 03:34:10 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-105,Tie,expert_40,,,Sun Jun 09 2024 17:08:47 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-105,Tie,author_0,,,Fri Apr 12 2024 14:05:34 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-105,Tie,author_0,,,Mon May 20 2024 15:10:49 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-106,B,expert_14,,,Wed Dec 25 2024 17:02:36 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-106,B,expert_14,,,Mon Sep 16 2024 23:28:30 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-106,Tie,expert_39,,,Sat Jul 27 2024 23:13:55 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-106,Tie,expert_39,,,Thu Sep 26 2024 14:02:29 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-106,Tie,expert_47,,,Mon Nov 18 2024 07:44:31 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-106,Tie,expert_47,,,Thu Jun 20 2024 18:50:57 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-106,A,expert_10,,,Fri Dec 13 2024 17:18:39 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-106,A,expert_10,,,Tue Feb 27 2024 23:06:46 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-106,A,expert_23,,,Sat Jun 15 2024 11:52:54 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-106,A,expert_23,,,Fri Apr 12 2024 03:15:32 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-106,A,expert_51,,,Tue Feb 13 2024 05:47:09 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-106,A,expert_51,,,Sat Nov 09 2024 11:24:52 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-106,Tie,expert_14,,,Tue Sep 17 2024 06:00:07 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-106,Tie,expert_14,,,Fri Apr 26 2024 00:59:33 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-106,B,expert_51,,,Fri Sep 20 2024 09:25:17 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-106,B,expert_51,,,Mon Jan 01 2024 17:14:15 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-106,B,author_0,,,Fri Mar 08 2024 02:56:14 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-106,B,author_0,,,Thu Mar 07 2024 15:50:56 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-106,Tie,expert_24,,,Sat Dec 21 2024 08:28:16 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-106,Tie,expert_24,,,Wed Jul 03 2024 16:58:24 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-106,Tie,expert_24,,,Fri Dec 06 2024 16:06:11 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-106,Tie,expert_24,,,Thu Apr 11 2024 09:52:39 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-106,Tie,expert_5,,,Tue Jan 09 2024 06:24:29 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-106,Tie,expert_5,,,Sat Jun 08 2024 17:49:46 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-106,B,expert_14,,,Fri Feb 02 2024 23:20:56 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-106,B,expert_14,,,Sun Dec 15 2024 09:18:20 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-106,A,expert_16,,,Thu Jun 13 2024 18:40:44 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-106,A,expert_16,,,Tue Sep 10 2024 19:59:26 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-106,Tie,expert_36,,,Wed Feb 14 2024 15:21:46 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-106,B,expert_36,,,Sun Feb 04 2024 09:06:23 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-106,B,expert_17,,,Thu Jun 13 2024 06:13:56 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-106,B,expert_17,,,Sun May 12 2024 09:48:43 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-106,B,expert_53,,,Wed Jun 19 2024 13:39:31 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-106,B,expert_53,,,Wed Jun 12 2024 00:29:04 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-106,B,expert_57,,,Thu Dec 26 2024 08:07:10 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-106,B,expert_57,,,Sat Nov 02 2024 21:31:40 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-106,Tie,author_0,,,Mon Jan 08 2024 21:02:58 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-106,Tie,author_0,,,Sun Jan 14 2024 11:47:07 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-106,Tie,expert_49,,,Sat Oct 05 2024 02:54:55 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-106,Tie,expert_49,,,Fri Oct 25 2024 00:58:12 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-106,B,expert_13,,,Sun Sep 22 2024 21:00:17 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-106,B,expert_13,,,Sat May 18 2024 15:31:51 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-106,B,expert_9,,,Thu Jun 06 2024 22:01:21 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-106,Tie,expert_53,,,Mon Jan 08 2024 15:20:38 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-106,Tie,expert_53,,,Tue Mar 05 2024 02:39:43 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-107,Tie,expert_15,,,Thu Nov 07 2024 17:38:49 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-107,A,expert_15,,,Mon Jun 03 2024 10:59:47 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-107,B,expert_22,,,Sun Dec 15 2024 15:53:42 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-107,A,expert_22,,,Wed Jun 26 2024 12:36:20 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-107,A,expert_10,,,Tue Sep 24 2024 23:32:39 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-107,A,expert_10,,,Sat Dec 21 2024 00:29:47 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-107,Tie,author_0,,,Tue May 07 2024 02:22:27 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-107,Tie,author_0,,,Thu Aug 15 2024 08:39:00 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-107,B,expert_14,,,Sun May 12 2024 09:17:36 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-107,A,expert_14,,,Tue Mar 19 2024 09:36:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-107,Tie,author_5,,,Tue May 14 2024 12:01:34 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-107,B,author_5,,,Tue Feb 27 2024 18:42:45 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-107,Tie,expert_24,,,Tue May 07 2024 07:56:16 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-107,Tie,expert_24,,,Mon Jan 22 2024 13:40:39 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-107,B,expert_50,,,Sun May 19 2024 01:55:57 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-107,B,expert_50,,,Sun Aug 11 2024 02:57:42 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-107,Tie,author_0,,,Wed Oct 16 2024 10:32:10 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-107,A,author_0,,,Wed Jun 19 2024 15:15:53 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-107,A,expert_44,,,Thu Jun 20 2024 13:53:02 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-107,B,expert_44,,,Thu Oct 24 2024 01:17:07 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-107,Tie,expert_31,,,Tue Sep 17 2024 16:35:47 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-107,A,expert_31,,,Tue Sep 17 2024 07:25:29 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-107,Tie,expert_24,,,Sat Jan 13 2024 21:07:59 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-107,Tie,expert_24,,,Thu Feb 15 2024 16:11:56 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-107,Tie,expert_6,,,Tue Mar 19 2024 18:21:09 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-107,B,expert_6,,,Sun Apr 14 2024 20:02:13 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-107,Tie,expert_36,,,Sun Dec 15 2024 06:08:00 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-107,Tie,expert_36,,,Sat Jan 27 2024 13:40:33 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-107,A,expert_1,,,Fri Nov 15 2024 06:10:45 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-107,A,expert_1,,,Mon Mar 25 2024 20:38:07 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-107,Tie,expert_39,,,Tue Mar 26 2024 04:18:46 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-107,Tie,author_2,,,Fri Feb 02 2024 05:08:07 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-107,A,author_2,,,Sat Feb 10 2024 10:39:28 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-107,Tie,expert_0,,,Mon Jan 01 2024 22:31:27 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-107,A,expert_0,,,Tue Jun 04 2024 04:07:12 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-108,Tie,expert_35,,,Tue Nov 12 2024 08:14:13 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-108,Tie,expert_35,,,Sat May 04 2024 12:17:17 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-108,A,expert_57,,,Tue Jun 11 2024 23:00:06 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-108,Tie,expert_57,,,Mon Mar 04 2024 16:10:27 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-108,Tie,author_2,,,Sun May 12 2024 00:41:04 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-108,B,author_2,,,Fri Aug 16 2024 20:06:32 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-108,Tie,expert_45,,,Wed Sep 25 2024 05:40:21 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-108,B,expert_45,,,Sun Jun 23 2024 22:14:01 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-108,Tie,expert_53,,,Wed Feb 14 2024 13:07:10 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-108,Tie,expert_53,,,Mon Jun 10 2024 07:58:13 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-108,Tie,author_2,,,Tue May 28 2024 12:13:05 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-108,Tie,author_2,,,Tue Mar 05 2024 01:06:18 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-108,Tie,expert_19,,,Tue Nov 26 2024 03:32:17 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-108,A,expert_19,,,Wed May 01 2024 02:24:13 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-108,A,expert_8,,,Tue Apr 02 2024 03:38:35 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-108,B,expert_8,,,Sun Feb 25 2024 14:32:00 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-108,Tie,expert_36,,,Tue Jul 09 2024 14:19:45 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-108,Tie,expert_36,,,Tue Aug 20 2024 08:56:29 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-108,B,expert_28,,,Fri Dec 06 2024 20:17:43 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-108,B,expert_28,,,Wed Jun 26 2024 23:30:56 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-108,Tie,author_4,,,Mon Nov 04 2024 02:02:19 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-108,Tie,author_4,,,Sun Oct 20 2024 11:45:36 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-108,Tie,expert_53,,,Mon Jun 10 2024 03:56:57 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-108,Tie,expert_53,,,Mon May 06 2024 09:47:40 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-108,A,expert_25,,,Mon Sep 09 2024 01:26:21 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-108,A,expert_25,,,Thu Dec 26 2024 06:31:12 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-108,A,expert_49,,,Thu Jul 04 2024 19:14:09 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-108,A,expert_49,,,Mon May 13 2024 06:44:47 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-108,A,author_4,,,Sun Jan 07 2024 18:44:38 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-108,A,author_4,,,Sat Aug 17 2024 13:18:29 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-108,A,expert_39,,,Sat Mar 23 2024 20:29:36 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-108,Tie,expert_39,,,Mon Aug 19 2024 11:04:07 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-108,A,expert_17,,,Thu Oct 10 2024 05:29:33 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-108,A,expert_17,,,Mon Jan 22 2024 05:18:18 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-108,A,author_0,,,Thu Apr 25 2024 09:42:59 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-108,Tie,author_0,,,Sat Jul 20 2024 20:57:32 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-108,Tie,expert_19,,,Tue Oct 15 2024 08:21:39 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-108,Tie,expert_19,,,Thu Jun 13 2024 21:00:21 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-108,Tie,expert_10,,,Tue Jan 16 2024 01:36:19 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-108,B,expert_10,,,Wed Feb 21 2024 20:22:19 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-108,Tie,expert_13,,,Mon Jan 15 2024 14:45:05 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-108,Tie,expert_13,,,Wed Mar 27 2024 17:55:13 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-108,B,expert_35,,,Wed Oct 02 2024 20:36:56 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-108,Tie,expert_35,,,Wed May 15 2024 18:09:20 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-108,Tie,expert_41,,,Tue Jan 09 2024 23:32:42 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-108,B,expert_41,,,Sun Jun 16 2024 09:46:53 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-109,A,expert_9,,,Sat Aug 24 2024 11:06:49 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-109,Tie,expert_9,,,Mon Sep 02 2024 16:13:07 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-109,A,author_0,,,Sun May 26 2024 09:22:13 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-109,Tie,author_0,,,Mon May 27 2024 16:40:11 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-109,A,expert_17,,,Fri Oct 18 2024 15:08:43 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-109,Tie,expert_17,,,Sat Oct 19 2024 11:06:22 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-109,A,expert_29,,,Wed Sep 04 2024 14:21:56 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-109,B,expert_29,,,Mon Feb 12 2024 20:05:43 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-109,Tie,expert_3,,,Mon Jul 22 2024 16:18:20 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-109,Tie,expert_3,,,Thu Jan 25 2024 13:31:23 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-109,B,expert_20,,,Mon Sep 02 2024 05:11:36 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-109,Tie,expert_20,,,Mon Sep 16 2024 03:50:00 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-109,Tie,author_4,,,Fri Jul 05 2024 03:40:24 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-109,Tie,author_4,,,Thu Dec 05 2024 07:41:54 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-109,Tie,expert_24,,,Tue Jul 09 2024 20:37:02 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-109,Tie,expert_24,,,Wed Nov 13 2024 19:55:24 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-109,Tie,author_3,,,Mon Jan 22 2024 14:03:28 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-109,Tie,author_3,,,Mon Feb 05 2024 07:53:24 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-109,A,expert_56,,,Wed May 22 2024 00:38:12 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-109,A,expert_56,,,Tue Jun 18 2024 06:24:52 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-109,B,author_4,,,Wed May 22 2024 10:42:34 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-109,Tie,author_4,,,Fri Apr 05 2024 18:44:45 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-109,B,expert_0,,,Tue Dec 10 2024 07:46:20 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-109,Tie,expert_0,,,Thu May 09 2024 08:02:16 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-109,A,expert_29,,,Fri Aug 23 2024 00:37:25 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-109,Tie,expert_29,,,Mon May 20 2024 11:11:22 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-109,B,expert_35,,,Mon Oct 14 2024 09:40:02 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-109,Tie,expert_35,,,Fri Oct 04 2024 19:37:32 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-109,Tie,expert_49,,,Thu Nov 28 2024 12:02:25 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-109,Tie,expert_49,,,Sat Jun 01 2024 06:03:09 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-109,A,expert_32,,,Tue May 28 2024 13:47:16 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-109,Tie,expert_32,,,Wed Aug 14 2024 21:10:43 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-109,B,expert_0,,,Fri Jan 19 2024 09:05:58 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-109,B,expert_0,,,Fri Feb 02 2024 10:44:14 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-109,Tie,expert_29,,,Wed Dec 25 2024 02:24:55 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-109,Tie,expert_29,,,Thu Jul 11 2024 08:08:15 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-109,B,expert_6,,,Wed Aug 28 2024 18:34:09 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-109,A,expert_6,,,Fri Apr 26 2024 03:51:32 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-109,A,expert_24,,,Sun Aug 25 2024 03:45:58 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-109,Tie,expert_24,,,Thu Nov 28 2024 11:43:20 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-109,A,expert_42,,,Tue Oct 08 2024 04:27:34 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-109,Tie,expert_42,,,Sat Aug 03 2024 19:28:28 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-109,A,expert_30,,,Mon Apr 22 2024 19:06:02 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-109,A,expert_30,,,Sat Jul 13 2024 18:12:02 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-110,B,expert_22,,,Tue May 07 2024 10:30:50 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-110,B,expert_22,,,Sat Mar 23 2024 19:09:23 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-110,A,expert_2,,,Fri Mar 22 2024 15:07:56 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-110,A,expert_2,,,Sun Aug 25 2024 11:22:40 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-110,A,expert_53,,,Fri Apr 19 2024 06:26:28 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-110,A,expert_53,,,Tue Jan 23 2024 21:57:30 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-110,Tie,expert_36,,,Fri Mar 15 2024 12:41:00 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-110,A,expert_36,,,Fri Oct 25 2024 18:31:09 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-110,A,expert_0,,,Fri Nov 08 2024 10:11:56 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-110,A,expert_0,,,Wed Jul 24 2024 05:54:17 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-110,A,expert_37,,,Sat Jul 06 2024 22:09:22 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-110,Tie,expert_37,,,Sat Aug 24 2024 12:27:27 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-110,Tie,author_4,,,Thu Mar 07 2024 21:28:09 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-110,B,author_4,,,Sun Dec 15 2024 05:33:16 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-110,Tie,expert_24,,,Sat May 04 2024 16:01:15 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-110,Tie,expert_24,,,Tue Mar 26 2024 06:18:47 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-110,Tie,expert_24,,,Wed Jan 10 2024 17:05:35 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-110,Tie,expert_24,,,Thu Oct 24 2024 06:54:47 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-110,A,expert_41,,,Sun Feb 04 2024 03:03:53 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-110,B,expert_41,,,Wed May 22 2024 20:15:19 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-110,A,expert_45,,,Mon Jul 22 2024 20:36:21 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-110,Tie,expert_45,,,Wed Jan 03 2024 07:34:02 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-110,Tie,expert_53,,,Thu Apr 11 2024 00:20:56 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-110,Tie,expert_53,,,Mon Nov 11 2024 09:28:54 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-110,Tie,author_3,,,Wed Apr 03 2024 16:20:37 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-110,A,author_3,,,Tue Dec 24 2024 10:49:54 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-110,B,expert_38,,,Sat Jul 20 2024 05:43:22 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-110,A,expert_38,,,Sun Dec 15 2024 15:30:06 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-110,A,expert_51,,,Fri Sep 20 2024 16:04:50 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-110,A,expert_51,,,Mon Oct 21 2024 04:47:48 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-110,B,expert_16,,,Thu Jan 18 2024 12:05:58 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-110,A,expert_16,,,Fri Dec 06 2024 18:46:34 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-110,Tie,expert_24,,,Sat Jul 13 2024 18:02:59 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-110,Tie,expert_24,,,Fri Jan 26 2024 17:59:34 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-110,B,expert_0,,,Sun Apr 07 2024 13:26:00 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-110,Tie,expert_0,,,Mon Oct 07 2024 04:40:18 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-110,Tie,expert_32,,,Tue Nov 19 2024 20:31:46 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-110,A,expert_32,,,Tue Jun 11 2024 23:09:12 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-110,Tie,author_5,,,Thu Jun 06 2024 04:33:48 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-110,B,author_5,,,Fri Apr 12 2024 04:28:20 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-110,A,expert_12,,,Thu May 16 2024 17:08:58 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-110,B,expert_12,,,Mon Oct 07 2024 06:24:39 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-110,Tie,expert_3,,,Fri Aug 23 2024 02:13:38 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-110,B,expert_3,,,Tue Nov 19 2024 08:52:04 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-110,A,expert_34,,,Wed Jun 26 2024 03:46:53 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-110,A,expert_34,,,Thu Sep 05 2024 00:28:44 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-110,B,expert_16,,,Fri Jan 05 2024 03:22:37 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-110,B,expert_16,,,Tue Aug 06 2024 14:22:28 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-111,Tie,expert_21,,,Sun Apr 28 2024 21:49:31 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-111,B,expert_21,,,Thu Sep 05 2024 12:49:47 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-111,Tie,expert_24,,,Sat May 04 2024 11:06:04 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-111,Tie,expert_24,,,Mon Mar 25 2024 10:28:33 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-111,B,expert_50,,,Sat Mar 16 2024 02:33:27 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-111,B,expert_50,,,Thu May 16 2024 01:08:35 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-111,Tie,author_3,,,Sun Nov 10 2024 08:34:50 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-111,Tie,author_3,,,Sun Jul 07 2024 18:48:31 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-111,A,expert_41,,,Fri Mar 01 2024 16:28:11 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-111,A,expert_41,,,Sun Jul 14 2024 07:29:31 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-111,Tie,author_3,,,Sun Mar 24 2024 09:02:06 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-111,Tie,author_3,,,Wed Jan 10 2024 04:02:42 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-111,B,expert_12,,,Fri Sep 20 2024 02:26:22 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-111,Tie,expert_12,,,Fri Mar 08 2024 21:18:19 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-111,Tie,expert_24,,,Sat Jun 01 2024 08:20:55 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-111,Tie,expert_24,,,Fri Feb 09 2024 03:07:22 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-111,A,expert_38,,,Fri Sep 13 2024 00:23:01 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-111,Tie,expert_38,,,Sun Jan 21 2024 21:42:19 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-111,A,expert_36,,,Tue Oct 08 2024 00:49:57 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-111,B,expert_36,,,Thu Sep 12 2024 06:36:40 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-111,A,expert_48,,,Sat Oct 19 2024 16:05:12 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-111,Tie,expert_48,,,Thu Jul 25 2024 13:16:19 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-111,A,expert_37,,,Mon Jun 17 2024 15:01:19 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-111,B,expert_37,,,Sun Aug 04 2024 22:28:44 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-111,B,author_2,,,Mon May 06 2024 09:15:23 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-111,B,author_2,,,Sun Feb 11 2024 10:51:09 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-111,B,expert_4,,,Tue Jun 11 2024 18:37:15 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-111,B,expert_4,,,Wed Oct 02 2024 17:41:21 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-111,B,expert_49,,,Sat Aug 03 2024 03:29:24 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-111,Tie,expert_49,,,Wed Jun 19 2024 01:16:59 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-111,A,expert_43,,,Sun Nov 10 2024 13:20:37 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-111,Tie,expert_43,,,Tue Jul 09 2024 05:47:03 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-111,B,author_3,,,Wed Dec 25 2024 18:51:17 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-111,Tie,author_3,,,Wed Apr 03 2024 23:03:31 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-112,B,expert_24,,,Mon Oct 14 2024 19:21:56 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-112,B,expert_24,,,Sun Aug 11 2024 19:10:44 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-112,B,expert_13,,,Mon Mar 04 2024 20:01:13 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-112,B,expert_13,,,Mon Feb 19 2024 03:24:10 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-112,A,author_3,,,Mon Nov 18 2024 01:32:51 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-112,A,author_3,,,Wed Dec 11 2024 09:18:19 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-112,A,expert_41,,,Thu Jan 11 2024 02:41:57 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-112,A,expert_41,,,Fri Feb 23 2024 20:51:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-112,A,author_3,,,Sun Jun 02 2024 08:47:22 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-112,A,author_3,,,Sat Aug 17 2024 06:27:05 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-112,A,expert_2,,,Sat Mar 02 2024 17:25:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-112,A,expert_2,,,Wed Oct 09 2024 18:48:53 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-112,Tie,author_4,,,Wed May 22 2024 16:30:29 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-112,B,author_4,,,Fri Jan 26 2024 16:39:04 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-112,Tie,expert_24,,,Mon Jan 08 2024 23:15:15 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-112,Tie,expert_24,,,Sun Aug 18 2024 17:44:43 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-112,A,expert_42,,,Sat May 18 2024 01:16:51 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-112,Tie,expert_42,,,Thu Oct 24 2024 01:32:07 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-112,A,expert_56,,,Sun May 26 2024 00:29:26 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-112,A,expert_56,,,Tue Apr 09 2024 14:50:32 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-112,A,expert_7,,,Mon Jul 22 2024 10:29:11 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-112,A,expert_7,,,Fri Sep 27 2024 18:19:34 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-112,A,expert_41,,,Mon Mar 25 2024 16:35:35 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-112,B,expert_41,,,Sat Sep 28 2024 23:51:08 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-112,A,expert_49,,,Mon Apr 08 2024 14:47:38 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-112,A,expert_49,,,Sat Jun 01 2024 09:23:29 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-112,Tie,author_6,,,Tue Sep 17 2024 11:27:12 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-112,Tie,author_6,,,Thu Mar 28 2024 12:08:05 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-112,B,expert_0,,,Tue Sep 17 2024 15:03:51 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-112,B,expert_0,,,Mon Jun 17 2024 17:42:22 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-112,B,expert_0,,,Thu May 23 2024 10:04:52 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-112,B,expert_0,,,Sun Apr 21 2024 19:30:59 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-112,B,expert_17,,,Mon Sep 09 2024 19:24:42 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-112,Tie,expert_17,,,Tue Mar 12 2024 22:24:22 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-112,B,expert_32,,,Tue Apr 16 2024 12:43:39 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-112,A,expert_32,,,Tue Jan 23 2024 06:33:33 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-112,B,expert_44,,,Tue Apr 09 2024 12:52:06 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-112,Tie,expert_44,,,Tue Dec 10 2024 10:15:30 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-112,B,expert_48,,,Fri Aug 16 2024 20:08:01 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-112,Tie,expert_48,,,Sun Sep 15 2024 08:41:11 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-112,A,expert_39,,,Mon Mar 18 2024 23:33:28 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-112,A,expert_39,,,Thu Nov 14 2024 08:05:55 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-112,Tie,author_2,,,Sun May 26 2024 13:19:31 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-112,B,author_2,,,Thu Aug 01 2024 14:54:17 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-112,B,expert_7,,,Sat Jun 15 2024 02:57:04 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-112,B,expert_7,,,Sat Apr 13 2024 22:46:47 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-112,A,author_6,,,Wed Aug 28 2024 15:28:56 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-112,Tie,author_6,,,Tue Feb 13 2024 09:23:00 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-112,A,expert_40,,,Wed May 01 2024 03:09:03 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-112,Tie,expert_40,,,Wed Jan 17 2024 22:01:19 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-113,B,author_0,,,Mon Feb 26 2024 02:29:55 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-113,B,author_0,,,Thu Apr 04 2024 23:01:31 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-113,Tie,expert_56,,,Thu Feb 01 2024 23:40:37 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-113,Tie,expert_56,,,Mon May 27 2024 09:38:44 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-113,Tie,expert_9,,,Sat Jul 20 2024 06:40:56 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-113,B,expert_9,,,Wed Feb 07 2024 02:14:29 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-113,A,expert_5,,,Fri Dec 13 2024 19:48:25 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-113,Tie,expert_5,,,Wed Jul 10 2024 10:46:22 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-113,A,expert_9,,,Sat Dec 14 2024 21:57:03 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-113,A,expert_9,,,Wed Jul 10 2024 09:08:07 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-113,Tie,expert_27,,,Fri Dec 27 2024 20:38:25 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-113,A,expert_27,,,Fri Nov 15 2024 19:22:58 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-113,B,expert_50,,,Sun Oct 27 2024 04:34:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-113,A,expert_50,,,Wed Apr 17 2024 06:55:56 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-113,Tie,author_2,,,Sat Feb 17 2024 10:53:42 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-113,A,author_2,,,Sun Apr 28 2024 17:27:19 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-113,B,expert_48,,,Fri Jul 12 2024 12:15:16 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-113,A,expert_48,,,Sun Dec 15 2024 17:12:15 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-113,A,author_0,,,Thu Nov 28 2024 11:35:42 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-113,A,author_0,,,Sat Jul 13 2024 04:38:18 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-113,A,expert_27,,,Tue Jul 09 2024 16:22:37 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-113,A,expert_27,,,Tue May 28 2024 01:06:51 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-113,A,author_0,,,Thu Dec 12 2024 09:05:02 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-113,A,author_0,,,Fri Aug 16 2024 15:09:13 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-113,A,expert_51,,,Fri Mar 01 2024 00:06:09 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-113,B,expert_51,,,Mon Jul 15 2024 19:31:02 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-113,A,expert_13,,,Fri May 10 2024 00:41:39 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-113,Tie,expert_13,,,Tue Apr 09 2024 08:50:46 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-113,A,expert_56,,,Thu Jul 04 2024 21:29:52 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-113,Tie,expert_56,,,Mon Aug 19 2024 08:12:11 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-113,Tie,expert_45,,,Mon Nov 11 2024 22:33:50 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-113,Tie,expert_45,,,Fri Dec 20 2024 09:21:58 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-113,B,expert_0,,,Mon Nov 04 2024 23:58:10 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-113,B,expert_0,,,Mon Apr 15 2024 16:32:36 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-113,B,expert_29,,,Sun Feb 25 2024 21:10:48 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-113,Tie,expert_29,,,Wed Aug 07 2024 13:39:49 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-113,B,expert_14,,,Mon Jan 15 2024 18:11:51 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-113,B,expert_14,,,Thu May 09 2024 07:16:18 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-113,B,expert_23,,,Thu Dec 05 2024 17:01:23 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-113,Tie,expert_23,,,Tue Apr 02 2024 08:21:52 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-114,B,expert_41,,,Fri Jan 26 2024 06:02:22 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-114,B,expert_41,,,Tue Mar 12 2024 19:56:48 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-114,B,expert_47,,,Thu Jan 25 2024 18:02:16 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-114,B,expert_47,,,Wed Aug 21 2024 21:36:16 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-114,Tie,expert_21,,,Tue Jun 11 2024 16:57:58 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-114,A,expert_21,,,Fri Aug 09 2024 23:53:46 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-114,A,expert_43,,,Mon Jan 01 2024 07:27:57 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-114,A,expert_43,,,Wed Apr 24 2024 16:43:45 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-114,B,expert_39,,,Mon Sep 09 2024 10:44:35 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-114,B,expert_39,,,Sat Dec 21 2024 14:56:37 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-114,A,expert_39,,,Sun Jun 09 2024 21:05:38 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-114,A,expert_39,,,Wed Mar 20 2024 18:13:45 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-114,Tie,author_0,,,Thu Feb 22 2024 04:55:16 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-114,Tie,author_0,,,Sun Mar 10 2024 14:48:07 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-114,A,author_4,,,Sat Jul 20 2024 07:02:50 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-114,A,author_4,,,Thu Jun 13 2024 02:23:43 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-114,Tie,expert_0,,,Thu May 02 2024 22:34:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-114,A,expert_0,,,Tue Sep 03 2024 07:04:50 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-114,A,expert_4,,,Sun Nov 10 2024 13:50:50 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-114,A,expert_4,,,Fri Mar 22 2024 23:17:31 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-114,Tie,expert_1,,,Wed Apr 03 2024 16:33:38 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-114,Tie,expert_1,,,Tue Apr 16 2024 09:58:56 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-114,A,expert_22,,,Fri Feb 23 2024 18:42:36 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-114,A,expert_22,,,Sat Mar 23 2024 11:36:10 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-114,A,expert_7,,,Thu Mar 28 2024 07:11:16 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-114,A,expert_7,,,Sat Jan 13 2024 00:34:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-114,B,expert_23,,,Thu Oct 24 2024 06:51:03 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-114,A,expert_23,,,Tue Mar 05 2024 21:17:47 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-114,A,expert_24,,,Thu Nov 07 2024 02:18:47 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-114,A,expert_24,,,Fri Jun 07 2024 18:54:21 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-114,Tie,expert_32,,,Fri Apr 19 2024 08:34:16 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-114,B,expert_32,,,Thu Jun 06 2024 23:01:31 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-114,Tie,expert_32,,,Fri May 24 2024 14:14:31 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-114,B,expert_32,,,Sat Jul 20 2024 16:21:24 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-114,B,expert_49,,,Mon Jan 15 2024 04:44:39 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-114,Tie,expert_49,,,Fri Oct 04 2024 06:02:11 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-114,Tie,expert_9,,,Thu Dec 05 2024 07:54:37 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-114,B,expert_9,,,Sat Mar 23 2024 18:10:58 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-114,Tie,expert_37,,,Fri Jan 26 2024 14:03:46 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-114,Tie,expert_37,,,Wed Jul 17 2024 19:10:26 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-115,Tie,author_2,,,Fri Nov 01 2024 06:57:51 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-115,Tie,author_2,,,Fri Jul 12 2024 21:15:18 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-115,B,author_0,,,Fri Oct 18 2024 01:39:07 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-115,B,author_0,,,Sat Jun 01 2024 15:09:04 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-115,Tie,expert_23,,,Sun Jan 21 2024 02:01:42 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-115,A,expert_23,,,Tue Jun 18 2024 20:07:51 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-115,Tie,expert_46,,,Wed Apr 10 2024 09:57:01 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-115,Tie,expert_46,,,Mon Mar 18 2024 03:38:59 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-115,B,expert_24,,,Sun Jun 16 2024 12:08:59 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-115,B,expert_24,,,Sat Aug 24 2024 20:23:58 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-115,B,expert_34,,,Thu Oct 03 2024 07:58:45 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-115,Tie,expert_34,,,Sat Sep 28 2024 17:06:24 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-115,Tie,expert_35,,,Fri Oct 11 2024 20:40:25 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-115,A,expert_35,,,Thu Jun 13 2024 11:49:23 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-115,A,expert_24,,,Wed Apr 03 2024 05:59:22 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-115,A,expert_24,,,Sat Jun 15 2024 16:42:23 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-115,A,author_0,,,Mon Oct 14 2024 10:31:55 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-115,A,author_0,,,Tue Nov 26 2024 14:19:42 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-115,A,author_2,,,Wed Apr 10 2024 06:55:07 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-115,A,author_2,,,Sat Sep 14 2024 17:51:42 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-115,A,expert_29,,,Mon Sep 23 2024 01:26:01 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-115,A,expert_29,,,Tue Feb 06 2024 03:25:56 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-115,A,expert_32,,,Wed May 22 2024 19:09:36 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-115,A,expert_32,,,Fri Jan 12 2024 19:00:19 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-115,A,expert_7,,,Wed Dec 18 2024 00:51:54 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-115,A,expert_7,,,Fri Jan 05 2024 03:20:44 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-115,A,author_0,,,Wed Jan 03 2024 12:11:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-115,A,author_0,,,Sun Oct 20 2024 04:23:24 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-115,A,expert_31,,,Sat Oct 19 2024 10:44:48 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-115,A,expert_31,,,Mon Feb 05 2024 15:36:55 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-115,Tie,expert_19,,,Sat Dec 21 2024 00:44:39 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-115,Tie,expert_19,,,Fri Jun 21 2024 04:25:59 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-115,B,expert_21,,,Sat Aug 17 2024 22:29:47 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-115,B,expert_21,,,Thu Jun 13 2024 09:43:58 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-115,Tie,expert_10,,,Tue Apr 16 2024 00:03:58 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-115,Tie,expert_10,,,Wed Nov 13 2024 17:13:44 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-115,Tie,expert_39,,,Mon Nov 18 2024 11:05:42 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-115,A,expert_39,,,Fri Aug 16 2024 05:48:00 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-115,Tie,expert_9,,,Sun Apr 14 2024 23:57:58 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-115,Tie,expert_9,,,Mon Apr 15 2024 04:55:25 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-115,B,expert_0,,,Fri Mar 08 2024 10:37:36 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-115,B,expert_0,,,Wed Jun 26 2024 21:22:52 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-115,B,expert_24,,,Sat Jun 08 2024 08:59:33 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-115,B,expert_24,,,Sun Oct 27 2024 02:03:52 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-115,A,expert_18,,,Sat Jan 20 2024 21:46:02 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-115,Tie,expert_18,,,Fri May 24 2024 19:49:39 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-116,B,expert_6,,,Sat Oct 12 2024 17:43:36 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-116,B,expert_6,,,Fri Oct 18 2024 18:03:41 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-116,B,expert_20,,,Fri Sep 27 2024 11:59:42 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-116,A,expert_20,,,Tue Nov 05 2024 07:18:15 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-116,A,expert_0,,,Wed Aug 28 2024 11:25:41 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-116,B,expert_39,,,Fri Jan 26 2024 17:40:48 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-116,B,expert_39,,,Tue May 14 2024 21:21:01 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-116,Tie,expert_53,,,Mon Mar 11 2024 10:17:47 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-116,Tie,expert_53,,,Sat Mar 09 2024 23:37:27 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-116,Tie,expert_55,,,Tue Dec 24 2024 08:57:48 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-116,Tie,expert_55,,,Fri Jan 05 2024 04:32:10 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-116,Tie,expert_9,,,Tue Oct 22 2024 15:40:58 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-116,Tie,expert_9,,,Sun Jun 02 2024 12:33:02 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-116,B,author_3,,,Sun Jul 28 2024 07:41:21 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-116,Tie,author_3,,,Sun Jun 16 2024 02:06:47 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-116,B,expert_24,,,Wed May 01 2024 21:04:45 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-116,Tie,expert_24,,,Wed Jul 10 2024 03:24:44 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-116,B,expert_31,,,Wed May 15 2024 00:32:12 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-116,B,expert_31,,,Sun Dec 15 2024 05:14:14 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-116,A,expert_14,,,Tue Jul 02 2024 17:04:18 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-116,A,expert_12,,,Thu Sep 19 2024 19:48:58 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-116,Tie,expert_12,,,Wed Jun 05 2024 22:34:48 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-116,A,expert_42,,,Fri Nov 22 2024 14:51:04 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-116,A,expert_42,,,Sat May 25 2024 09:05:33 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-116,Tie,author_2,,,Thu Jan 18 2024 10:40:58 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-116,Tie,author_2,,,Fri Nov 08 2024 02:43:09 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-116,B,author_3,,,Thu Nov 21 2024 17:14:30 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-116,Tie,author_3,,,Tue Nov 19 2024 11:08:32 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-116,B,author_4,,,Wed Jan 10 2024 22:58:02 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-116,B,author_4,,,Fri Jan 19 2024 05:07:02 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-116,B,expert_36,,,Sat May 25 2024 10:21:17 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-116,B,expert_36,,,Thu Nov 21 2024 20:07:41 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-116,B,expert_45,,,Tue Jul 23 2024 21:10:07 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-116,A,expert_45,,,Sun Jul 07 2024 02:19:47 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-116,Tie,expert_38,,,Tue Oct 15 2024 01:15:02 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-116,Tie,expert_38,,,Sat May 04 2024 10:03:35 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-116,Tie,expert_29,,,Tue Dec 10 2024 21:19:03 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-116,Tie,expert_29,,,Fri Apr 19 2024 13:17:51 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-116,A,expert_49,,,Tue Aug 27 2024 05:11:14 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-116,B,expert_49,,,Sun Apr 07 2024 10:37:24 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-117,B,expert_7,,,Sun Apr 07 2024 22:43:10 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-117,B,expert_7,,,Tue May 21 2024 17:37:32 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-117,Tie,expert_10,,,Mon Jan 15 2024 19:15:22 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-117,Tie,expert_10,,,Thu Dec 26 2024 21:16:42 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-117,Tie,expert_46,,,Tue Mar 05 2024 23:45:52 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-117,Tie,expert_46,,,Sat Nov 02 2024 20:00:25 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-117,B,expert_23,,,Tue Apr 23 2024 16:01:01 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-117,B,expert_23,,,Wed Sep 11 2024 00:20:05 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-117,B,expert_23,,,Sat Aug 03 2024 10:51:29 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-117,B,expert_23,,,Mon Feb 26 2024 05:30:40 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-117,B,expert_38,,,Mon May 20 2024 18:09:15 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-117,B,expert_38,,,Sat Dec 14 2024 12:05:40 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-117,A,author_2,,,Mon Sep 02 2024 03:14:26 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-117,Tie,author_2,,,Wed Aug 07 2024 05:51:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-117,A,author_4,,,Sun Nov 17 2024 19:52:58 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-117,A,author_4,,,Mon Apr 08 2024 14:56:25 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-117,A,expert_42,,,Sat Sep 21 2024 06:46:08 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-117,A,expert_42,,,Sun Aug 11 2024 09:17:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-117,Tie,author_4,,,Thu Oct 17 2024 12:33:21 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-117,A,author_4,,,Thu Mar 28 2024 16:13:46 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-117,Tie,expert_34,,,Tue Oct 08 2024 03:53:42 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-117,A,expert_34,,,Thu Aug 01 2024 23:27:31 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-117,B,author_4,,,Sun Oct 13 2024 18:58:44 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-117,B,author_4,,,Mon Dec 23 2024 11:22:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-117,B,expert_56,,,Mon Nov 18 2024 07:36:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-117,B,expert_56,,,Fri Apr 12 2024 20:55:44 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-117,A,expert_0,,,Fri Dec 13 2024 23:04:31 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-117,A,expert_0,,,Fri May 10 2024 10:42:27 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-117,A,expert_24,,,Wed May 22 2024 17:39:56 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-117,A,expert_24,,,Tue May 28 2024 00:45:47 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-117,A,expert_55,,,Tue Jul 09 2024 21:48:18 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-117,A,expert_55,,,Sun May 19 2024 22:14:24 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-117,A,author_0,,,Sun Jun 09 2024 07:31:33 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-117,A,author_0,,,Wed Mar 13 2024 04:23:30 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-117,A,expert_11,,,Sat May 11 2024 03:47:13 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-117,A,expert_11,,,Tue May 28 2024 08:45:12 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-117,B,expert_28,,,Mon Apr 08 2024 07:07:37 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-117,B,expert_28,,,Sun Jul 21 2024 09:53:53 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-117,B,expert_51,,,Thu Apr 04 2024 07:10:30 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-117,Tie,expert_51,,,Wed Jul 17 2024 13:05:54 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-117,B,expert_27,,,Sun Jul 28 2024 14:51:59 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-117,Tie,expert_27,,,Sun Jan 14 2024 16:33:14 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-117,Tie,expert_52,,,Tue Jun 25 2024 11:32:43 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-117,Tie,expert_52,,,Tue Feb 13 2024 21:47:42 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-117,B,author_0,,,Sat Nov 23 2024 08:47:21 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-117,B,author_0,,,Wed Dec 25 2024 05:01:57 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-117,B,expert_3,,,Mon Aug 12 2024 13:01:40 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-117,B,expert_3,,,Sat Jan 27 2024 14:57:34 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-117,B,expert_53,,,Sat Aug 10 2024 16:04:12 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-117,B,expert_53,,,Fri Aug 09 2024 09:45:06 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-118,B,author_0,,,Tue Apr 16 2024 22:03:17 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-118,Tie,author_0,,,Tue Oct 01 2024 02:46:54 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-118,A,author_4,,,Mon Oct 21 2024 06:05:27 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-118,Tie,author_4,,,Tue Jun 18 2024 01:20:27 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-118,A,expert_23,,,Thu Dec 26 2024 02:23:23 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-118,A,expert_23,,,Sat Dec 21 2024 20:04:21 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-118,A,expert_23,,,Mon Aug 12 2024 16:20:38 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-118,B,expert_23,,,Mon Apr 15 2024 14:31:04 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-118,A,author_4,,,Sun Nov 03 2024 02:39:17 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-118,A,author_4,,,Wed Nov 06 2024 18:38:13 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-118,A,author_4,,,Thu Jul 11 2024 02:45:13 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-118,Tie,author_4,,,Wed Sep 18 2024 07:50:42 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-118,A,expert_55,,,Thu Dec 12 2024 10:02:17 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-118,Tie,expert_55,,,Tue Jul 02 2024 18:09:55 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-118,A,expert_41,,,Sat Sep 14 2024 23:24:58 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-118,A,expert_41,,,Fri Jul 26 2024 02:26:18 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-118,Tie,expert_0,,,Sat May 04 2024 07:12:37 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-118,B,expert_0,,,Mon Sep 09 2024 02:54:54 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-118,Tie,author_6,,,Sun Mar 24 2024 23:22:12 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-118,Tie,author_6,,,Sun Oct 20 2024 22:29:54 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-118,Tie,expert_45,,,Sun Apr 14 2024 13:00:18 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-118,Tie,expert_45,,,Wed Jan 10 2024 19:59:41 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-118,A,expert_51,,,Tue Sep 24 2024 15:31:41 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-118,Tie,expert_51,,,Wed Dec 11 2024 16:43:03 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-118,Tie,expert_21,,,Sat Dec 21 2024 04:37:22 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-118,B,expert_21,,,Fri May 10 2024 09:09:53 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-118,Tie,expert_23,,,Wed Dec 11 2024 09:43:11 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-118,B,expert_23,,,Wed May 22 2024 02:39:10 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-118,B,expert_24,,,Fri May 10 2024 10:39:25 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-118,Tie,expert_24,,,Tue Feb 06 2024 03:27:05 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-118,Tie,expert_40,,,Sun Sep 08 2024 12:03:37 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-118,B,expert_40,,,Sun Nov 24 2024 11:34:04 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-118,Tie,expert_55,,,Fri Dec 13 2024 02:18:01 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-118,Tie,expert_55,,,Wed Nov 13 2024 23:34:25 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-118,B,expert_29,,,Thu Nov 07 2024 04:17:27 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-118,Tie,expert_29,,,Sat May 18 2024 07:02:21 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-118,A,expert_15,,,Mon May 27 2024 13:30:30 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-118,B,expert_15,,,Thu Jan 04 2024 05:09:32 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-119,B,author_4,,,Fri Jan 26 2024 00:22:28 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-119,B,author_4,,,Wed Feb 28 2024 19:20:45 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-119,B,expert_31,,,Tue Jun 04 2024 23:24:54 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-119,B,expert_31,,,Mon Apr 15 2024 01:44:23 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-119,B,expert_40,,,Wed Aug 14 2024 04:22:02 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-119,B,expert_40,,,Sun Jul 21 2024 07:59:40 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-119,Tie,expert_37,,,Thu Nov 14 2024 22:07:32 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-119,A,expert_37,,,Sun Oct 27 2024 00:26:10 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-119,A,author_2,,,Sun Dec 15 2024 00:13:49 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-119,A,author_2,,,Fri Jul 19 2024 12:51:59 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-119,A,expert_10,,,Thu Nov 21 2024 06:09:48 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-119,A,expert_10,,,Sun Jun 23 2024 04:56:51 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-119,B,author_0,,,Sat May 11 2024 22:03:13 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-119,Tie,author_0,,,Thu Mar 28 2024 06:45:02 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-119,A,expert_25,,,Sat Sep 28 2024 06:35:18 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-119,A,expert_25,,,Fri Mar 15 2024 06:56:57 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-119,A,expert_27,,,Wed Dec 04 2024 06:10:42 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-119,A,expert_27,,,Fri May 24 2024 12:30:17 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-119,B,expert_31,,,Sun Feb 18 2024 23:59:47 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-119,Tie,expert_31,,,Fri Mar 01 2024 00:51:30 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-119,A,expert_8,,,Fri Aug 16 2024 18:51:21 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-119,Tie,expert_8,,,Sun Sep 15 2024 00:52:26 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-119,Tie,expert_35,,,Thu Jul 18 2024 15:32:10 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-119,Tie,expert_35,,,Tue Jul 16 2024 09:40:16 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-119,B,author_0,,,Wed Nov 27 2024 19:08:08 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-119,B,author_0,,,Sat Feb 10 2024 18:01:08 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-119,B,expert_21,,,Mon Jul 22 2024 11:25:08 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-119,B,expert_21,,,Fri Sep 20 2024 11:53:05 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-119,B,expert_26,,,Wed Feb 07 2024 21:20:22 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-119,Tie,expert_26,,,Fri Sep 06 2024 09:12:31 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-119,B,expert_9,,,Sat Jun 08 2024 01:10:47 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-119,Tie,expert_9,,,Mon Jun 17 2024 11:13:40 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-119,Tie,expert_1,,,Mon Aug 19 2024 12:36:40 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-119,B,expert_1,,,Wed Apr 17 2024 01:19:22 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-119,Tie,expert_15,,,Wed May 01 2024 09:25:47 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-119,B,expert_15,,,Sat Feb 17 2024 20:28:32 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-119,A,expert_38,,,Tue Dec 03 2024 00:30:37 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-119,Tie,expert_38,,,Sat Apr 27 2024 21:55:23 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-120,Tie,author_2,,,Mon Mar 04 2024 18:51:30 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-120,Tie,author_2,,,Sun Jul 28 2024 08:56:01 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-120,Tie,expert_39,,,Thu Sep 12 2024 00:25:03 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-120,Tie,expert_39,,,Wed Sep 25 2024 22:58:38 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-120,A,expert_0,,,Sun Jun 23 2024 04:33:42 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-120,A,expert_0,,,Sat Jul 27 2024 01:33:13 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-120,A,author_0,,,Sun May 19 2024 00:40:16 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-120,Tie,author_0,,,Wed Feb 14 2024 16:16:55 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-120,A,expert_10,,,Wed Feb 21 2024 08:27:11 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-120,Tie,expert_10,,,Sat Nov 23 2024 06:54:01 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-120,Tie,expert_7,,,Sun Jul 28 2024 07:38:16 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-120,A,expert_7,,,Wed Mar 20 2024 04:23:31 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-120,B,expert_19,,,Sun Nov 17 2024 20:21:04 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-120,Tie,expert_19,,,Fri Apr 19 2024 23:11:35 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-120,B,expert_2,,,Thu Mar 14 2024 16:29:58 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-120,Tie,expert_2,,,Thu Nov 14 2024 15:51:13 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-120,B,expert_55,,,Mon Apr 22 2024 00:21:12 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-120,Tie,expert_55,,,Sun Aug 04 2024 11:36:46 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-120,A,expert_43,,,Sun Jan 07 2024 08:41:18 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-120,A,expert_43,,,Wed Apr 17 2024 02:05:42 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-120,Tie,expert_22,,,Tue Feb 06 2024 21:14:52 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-120,Tie,expert_22,,,Tue Sep 17 2024 06:01:57 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-120,B,expert_56,,,Sat Aug 10 2024 20:26:13 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-120,B,expert_56,,,Sat Jan 20 2024 09:58:21 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-120,B,expert_24,,,Thu Nov 07 2024 18:14:20 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-120,Tie,expert_24,,,Fri Jun 14 2024 16:38:26 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-120,B,expert_56,,,Wed Mar 13 2024 22:15:21 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-120,B,expert_56,,,Sat Oct 26 2024 01:46:09 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-120,B,expert_43,,,Wed Jul 17 2024 22:26:31 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-120,B,expert_43,,,Sun Apr 07 2024 09:34:15 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-120,B,expert_47,,,Sat Nov 09 2024 11:46:01 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-120,B,expert_47,,,Sat Aug 24 2024 13:35:13 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-120,Tie,expert_12,,,Sun Feb 11 2024 05:08:19 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-120,Tie,expert_12,,,Sun Apr 07 2024 03:36:09 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-120,A,expert_0,,,Fri Dec 06 2024 07:41:44 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-120,A,expert_0,,,Thu Dec 05 2024 23:56:12 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-121,B,expert_28,,,Wed Nov 20 2024 23:01:04 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-121,B,expert_28,,,Fri Jan 19 2024 23:12:47 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-121,B,expert_51,,,Fri Dec 20 2024 04:37:21 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-121,B,expert_51,,,Sat Aug 24 2024 03:08:24 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-121,B,expert_29,,,Sun Aug 18 2024 01:50:20 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-121,B,expert_29,,,Wed Dec 11 2024 04:16:23 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-121,B,expert_32,,,Tue Jun 04 2024 09:49:59 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-121,B,expert_32,,,Wed Mar 20 2024 19:15:35 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-121,Tie,expert_17,,,Tue Oct 22 2024 23:02:01 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-121,B,expert_17,,,Wed Jul 03 2024 11:31:17 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-121,A,expert_57,,,Sat Jan 20 2024 00:07:09 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-121,B,expert_57,,,Sat May 11 2024 18:13:33 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-121,A,author_5,,,Fri Sep 20 2024 05:56:29 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-121,A,author_5,,,Fri Jan 19 2024 20:23:01 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-121,Tie,author_3,,,Wed Oct 02 2024 19:24:50 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-121,B,author_3,,,Sun Mar 24 2024 15:37:36 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-121,A,expert_7,,,Sat Dec 07 2024 11:38:37 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-121,A,expert_7,,,Fri Jan 26 2024 01:06:22 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-121,Tie,expert_0,,,Thu Apr 11 2024 16:59:40 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-121,Tie,expert_0,,,Thu Jan 25 2024 03:09:43 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-121,B,expert_57,,,Mon Nov 18 2024 00:34:44 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-121,A,expert_57,,,Sat Jul 13 2024 01:31:22 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-121,A,expert_8,,,Sun Sep 01 2024 21:13:11 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-121,A,expert_8,,,Sun Jun 23 2024 06:14:15 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-121,B,expert_28,,,Wed Dec 18 2024 10:53:51 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-121,B,expert_28,,,Thu Jul 11 2024 19:36:08 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-121,B,expert_48,,,Thu Oct 03 2024 16:51:26 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-121,B,expert_48,,,Mon Jun 24 2024 02:11:06 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-121,B,expert_9,,,Sat Dec 07 2024 21:31:01 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-121,B,expert_9,,,Fri Oct 25 2024 19:20:30 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-121,Tie,author_6,,,Sun Nov 17 2024 08:27:32 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-121,A,author_6,,,Sun Mar 24 2024 01:13:21 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-121,B,expert_0,,,Wed Aug 14 2024 11:03:50 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-121,B,expert_4,,,Fri Aug 23 2024 07:44:22 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-121,B,expert_4,,,Thu Sep 05 2024 20:37:27 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-121,A,expert_32,,,Wed Oct 23 2024 04:23:27 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-121,A,expert_32,,,Wed Jun 26 2024 00:14:24 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-121,A,expert_50,,,Mon Nov 18 2024 00:26:21 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-121,A,expert_50,,,Mon Mar 18 2024 03:12:21 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-122,B,author_4,,,Mon Sep 02 2024 01:29:20 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-122,B,author_4,,,Wed Feb 14 2024 02:59:44 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-122,A,expert_55,,,Sun Sep 08 2024 13:17:17 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-122,Tie,expert_55,,,Mon Nov 04 2024 10:19:13 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-122,Tie,author_5,,,Mon Oct 21 2024 08:56:51 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-122,A,author_5,,,Fri Feb 23 2024 06:06:20 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-122,Tie,expert_43,,,Sun May 12 2024 17:06:01 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-122,Tie,expert_43,,,Sat Jun 15 2024 03:34:57 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-122,Tie,expert_1,,,Mon Feb 19 2024 11:46:00 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-122,A,expert_1,,,Sat Aug 17 2024 07:09:15 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-122,Tie,expert_24,,,Sun Nov 10 2024 07:06:37 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-122,Tie,expert_24,,,Wed Apr 10 2024 01:27:07 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-122,A,expert_48,,,Mon Jul 22 2024 22:54:19 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-122,B,expert_48,,,Tue Apr 23 2024 20:37:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-122,Tie,author_2,,,Sat Oct 12 2024 23:43:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-122,A,author_2,,,Mon May 27 2024 03:51:24 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-122,B,expert_48,,,Wed Apr 17 2024 02:26:33 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-122,A,expert_48,,,Sat Dec 28 2024 04:17:44 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-122,A,expert_8,,,Sat Sep 14 2024 01:28:17 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-122,B,expert_8,,,Thu Mar 07 2024 02:36:49 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-122,A,expert_0,,,Sun Oct 06 2024 03:02:33 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-122,A,expert_0,,,Sun Jun 16 2024 00:33:06 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-122,B,author_0,,,Mon Oct 14 2024 09:35:40 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-122,B,author_0,,,Thu Jul 04 2024 11:46:52 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-122,B,expert_13,,,Sat Jun 01 2024 22:42:56 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-122,Tie,expert_13,,,Fri Sep 27 2024 20:39:15 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-122,B,expert_9,,,Thu Dec 19 2024 23:10:25 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-122,Tie,expert_9,,,Thu Sep 19 2024 02:06:28 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-122,B,expert_56,,,Thu Jul 25 2024 16:11:36 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-122,B,expert_56,,,Thu Apr 04 2024 21:38:10 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-122,Tie,expert_24,,,Mon Aug 19 2024 01:26:21 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-122,B,expert_0,,,Wed Nov 13 2024 15:52:39 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-122,B,expert_0,,,Sun Jan 14 2024 10:35:13 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-122,B,expert_20,,,Mon Dec 16 2024 07:09:03 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-122,B,expert_20,,,Sat Jun 22 2024 02:51:56 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-122,A,expert_35,,,Thu Feb 22 2024 04:55:03 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-122,A,expert_35,,,Wed Jan 17 2024 03:26:16 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-123,B,author_0,,,Wed Mar 13 2024 13:56:01 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-123,B,author_0,,,Sun Jul 28 2024 20:09:23 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-123,B,expert_48,,,Sat Jan 13 2024 05:52:22 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-123,B,expert_48,,,Thu Jun 06 2024 21:09:41 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-123,A,expert_48,,,Wed Feb 21 2024 20:53:43 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-123,B,expert_48,,,Fri Sep 06 2024 08:31:42 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-123,A,expert_28,,,Fri Nov 22 2024 16:47:11 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-123,A,expert_28,,,Sat Jan 27 2024 05:37:02 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-123,B,expert_32,,,Tue Apr 09 2024 03:12:54 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-123,B,expert_32,,,Fri Oct 04 2024 18:07:28 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-123,B,expert_7,,,Sun Sep 01 2024 09:31:42 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-123,B,expert_7,,,Wed Dec 18 2024 04:58:12 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-123,A,expert_1,,,Thu Nov 14 2024 00:47:38 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-123,B,expert_1,,,Sun Aug 25 2024 23:27:18 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-123,A,expert_47,,,Fri Dec 27 2024 19:19:41 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-123,A,expert_47,,,Wed Feb 28 2024 01:18:53 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-123,A,expert_36,,,Fri Nov 22 2024 10:53:19 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-123,A,expert_36,,,Tue Sep 17 2024 13:02:19 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-123,A,expert_44,,,Sat Dec 28 2024 19:29:59 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-123,A,expert_44,,,Wed Mar 13 2024 05:13:07 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-123,Tie,author_4,,,Sun Dec 15 2024 08:06:31 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-123,Tie,author_4,,,Thu Jul 18 2024 22:39:37 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-123,B,expert_44,,,Sat Apr 06 2024 08:16:38 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-123,B,expert_44,,,Wed Aug 21 2024 02:53:44 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-123,Tie,expert_17,,,Mon Oct 14 2024 10:25:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-123,Tie,expert_17,,,Wed Aug 21 2024 17:24:11 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-123,Tie,expert_24,,,Sat Dec 07 2024 09:18:28 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-123,Tie,expert_24,,,Sat May 11 2024 11:10:07 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-123,A,expert_34,,,Mon Nov 04 2024 15:09:28 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-123,Tie,expert_34,,,Sun Jun 23 2024 17:42:24 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-123,Tie,expert_38,,,Mon Oct 21 2024 13:04:48 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-123,Tie,expert_38,,,Wed Mar 06 2024 11:48:11 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-123,Tie,author_4,,,Tue Nov 19 2024 02:30:40 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-123,A,author_4,,,Mon Sep 02 2024 14:30:54 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-123,Tie,expert_24,,,Mon Jul 15 2024 12:01:00 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-123,Tie,expert_24,,,Wed Apr 10 2024 17:29:15 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-123,A,expert_3,,,Fri May 17 2024 14:51:25 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-123,A,expert_3,,,Wed Aug 07 2024 03:23:56 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-123,Tie,expert_25,,,Sun Sep 01 2024 02:33:29 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-123,A,expert_25,,,Tue Jan 02 2024 13:58:43 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-123,Tie,expert_21,,,Sat Jul 06 2024 06:48:47 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-123,B,expert_21,,,Mon Aug 26 2024 00:32:22 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-123,B,expert_41,,,Mon Nov 04 2024 10:14:43 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-123,B,expert_41,,,Fri Nov 08 2024 17:00:55 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-123,B,author_4,,,Fri Apr 05 2024 22:41:44 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-123,B,author_4,,,Tue Nov 19 2024 03:24:26 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-123,B,author_3,,,Sat Apr 20 2024 19:56:56 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-123,Tie,author_3,,,Sun Apr 14 2024 23:01:09 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-123,B,expert_0,,,Thu Mar 21 2024 09:26:51 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-123,B,expert_0,,,Fri Jul 26 2024 22:28:02 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-123,B,expert_22,,,Wed Feb 07 2024 03:32:44 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-123,B,expert_22,,,Sat Nov 23 2024 05:38:45 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-123,A,expert_40,,,Fri Aug 02 2024 03:20:10 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-123,A,expert_40,,,Sat Oct 05 2024 19:12:15 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-123,A,expert_25,,,Mon Aug 05 2024 05:35:59 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-123,A,expert_25,,,Thu May 16 2024 15:55:28 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-124,A,expert_48,,,Fri Mar 15 2024 17:56:43 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-124,B,expert_48,,,Tue May 21 2024 06:47:25 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-124,A,expert_40,,,Wed Jul 24 2024 12:44:55 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-124,Tie,expert_40,,,Wed Sep 04 2024 21:56:23 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-124,B,expert_24,,,Thu Jan 11 2024 08:00:07 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-124,A,expert_24,,,Tue Jan 02 2024 12:21:24 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-124,B,expert_51,,,Tue Apr 23 2024 20:24:28 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-124,B,expert_51,,,Fri Jan 26 2024 21:52:57 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-124,B,expert_7,,,Wed Dec 11 2024 19:41:24 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-124,A,expert_7,,,Sat Jun 08 2024 01:04:25 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-124,B,expert_4,,,Tue May 28 2024 08:10:19 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-124,A,expert_4,,,Wed Aug 07 2024 09:08:10 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-124,B,expert_12,,,Wed Dec 04 2024 16:11:27 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-124,A,expert_12,,,Sat Dec 21 2024 13:17:43 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-124,A,expert_49,,,Mon Oct 28 2024 10:50:34 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-124,B,expert_49,,,Sat Jul 06 2024 16:31:56 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-124,Tie,author_3,,,Thu Dec 19 2024 15:31:29 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-124,A,author_3,,,Fri Jun 21 2024 04:16:09 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-124,Tie,expert_24,,,Sat Dec 21 2024 00:08:54 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-124,A,expert_24,,,Sun Jun 16 2024 01:00:18 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-124,B,expert_45,,,Fri Aug 02 2024 10:52:35 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-124,Tie,expert_45,,,Sat Apr 27 2024 00:39:37 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-124,Tie,expert_0,,,Thu Aug 22 2024 17:25:16 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-124,Tie,expert_0,,,Sun Jul 14 2024 11:27:16 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-124,Tie,expert_53,,,Fri Oct 25 2024 01:15:15 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-124,B,expert_53,,,Tue Nov 12 2024 22:02:25 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-124,Tie,expert_26,,,Mon Apr 08 2024 23:52:42 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-124,B,expert_26,,,Thu Oct 17 2024 05:16:20 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-124,Tie,expert_8,,,Tue Dec 24 2024 01:45:22 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-124,B,expert_8,,,Mon Feb 26 2024 07:14:30 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-124,B,author_4,,,Sat Apr 27 2024 03:12:28 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-124,B,author_4,,,Thu Sep 05 2024 01:53:53 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-124,Tie,expert_57,,,Wed May 22 2024 10:45:15 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-124,B,expert_57,,,Tue Feb 06 2024 01:57:39 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-124,B,expert_5,,,Fri Aug 23 2024 06:45:15 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-124,A,expert_5,,,Mon Oct 07 2024 10:11:56 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-124,Tie,expert_11,,,Thu Jun 06 2024 22:38:18 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-124,B,expert_11,,,Mon Apr 22 2024 10:32:35 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-124,Tie,expert_54,,,Wed Apr 24 2024 19:10:26 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-124,B,expert_54,,,Fri Aug 16 2024 05:06:05 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-124,A,expert_33,,,Wed Jan 24 2024 10:09:11 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-124,A,expert_33,,,Tue Sep 03 2024 02:40:57 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-125,B,expert_47,,,Sat Jun 22 2024 05:02:23 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-125,B,expert_47,,,Fri Nov 22 2024 01:05:33 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-125,B,expert_38,,,Sun Jun 16 2024 00:40:51 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-125,B,expert_38,,,Sun Dec 15 2024 20:24:10 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-125,A,expert_0,,,Wed Mar 13 2024 08:05:16 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-125,A,expert_0,,,Sat Oct 05 2024 08:11:47 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-125,Tie,expert_24,,,Mon Nov 25 2024 00:21:06 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-125,Tie,expert_24,,,Sat Nov 02 2024 02:19:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-125,B,author_4,,,Mon Sep 09 2024 02:53:03 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-125,A,author_4,,,Wed Jan 03 2024 00:53:09 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-125,Tie,expert_9,,,Sun Jun 02 2024 18:51:52 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-125,Tie,expert_9,,,Thu Mar 21 2024 04:07:01 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-125,A,author_5,,,Wed Sep 25 2024 17:35:23 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-125,A,author_5,,,Fri Mar 01 2024 12:13:47 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-125,Tie,expert_34,,,Fri Jun 21 2024 04:51:02 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-125,Tie,expert_34,,,Fri Nov 15 2024 21:20:25 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-125,Tie,expert_2,,,Fri Jun 28 2024 07:05:35 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-125,Tie,expert_2,,,Wed Nov 06 2024 17:49:34 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-125,Tie,expert_24,,,Sat Mar 16 2024 04:25:23 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-125,Tie,expert_24,,,Fri Jul 12 2024 23:05:18 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-125,Tie,author_2,,,Mon Feb 12 2024 05:24:47 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-125,Tie,author_2,,,Mon Oct 07 2024 19:06:50 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-125,A,expert_31,,,Mon Aug 19 2024 12:59:29 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-125,B,expert_31,,,Sun Mar 24 2024 07:54:54 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-125,B,expert_49,,,Fri May 10 2024 05:21:44 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-125,B,expert_49,,,Mon May 13 2024 11:00:48 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-125,B,author_5,,,Wed Sep 18 2024 07:37:21 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-125,B,author_5,,,Sat Dec 21 2024 18:02:26 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-125,B,expert_5,,,Thu Aug 08 2024 08:11:54 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-125,B,expert_5,,,Mon Aug 19 2024 21:31:58 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-125,Tie,expert_9,,,Sat Oct 26 2024 07:14:51 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-125,Tie,expert_9,,,Fri Apr 05 2024 13:44:13 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-126,A,expert_16,,,Fri May 03 2024 21:05:59 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-126,A,expert_16,,,Sun Apr 14 2024 01:34:46 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-126,B,expert_42,,,Thu May 23 2024 07:12:13 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-126,A,expert_42,,,Sun Feb 04 2024 01:33:51 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-126,A,expert_8,,,Sun Apr 28 2024 10:08:37 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-126,A,expert_8,,,Tue May 28 2024 21:00:07 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-126,A,expert_20,,,Tue Oct 22 2024 16:41:48 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-126,B,expert_20,,,Sun Sep 08 2024 06:44:03 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-126,A,expert_36,,,Wed Jul 03 2024 07:44:50 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-126,A,expert_36,,,Sun Oct 13 2024 09:40:48 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-126,B,author_4,,,Mon Aug 26 2024 07:36:34 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-126,A,author_4,,,Sun Feb 11 2024 04:08:15 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-126,B,expert_51,,,Sat Oct 19 2024 18:00:52 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-126,A,expert_51,,,Tue Nov 05 2024 06:48:36 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-126,Tie,expert_49,,,Tue Sep 24 2024 09:01:19 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-126,B,expert_49,,,Mon Mar 11 2024 09:10:16 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-126,B,author_0,,,Sun Apr 28 2024 23:59:35 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-126,B,author_0,,,Thu Dec 26 2024 13:55:49 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-126,B,expert_0,,,Wed Mar 27 2024 13:19:39 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-126,A,expert_0,,,Sun May 19 2024 19:37:26 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-126,B,expert_2,,,Sun Nov 17 2024 10:29:12 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-126,B,expert_2,,,Tue Jun 18 2024 23:40:32 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-126,Tie,author_3,,,Mon Nov 18 2024 03:21:23 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-126,Tie,author_3,,,Tue May 14 2024 15:40:16 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-126,A,expert_32,,,Sun Feb 18 2024 22:13:40 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-126,B,expert_32,,,Sat May 11 2024 15:24:44 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-126,Tie,expert_53,,,Tue Feb 06 2024 13:17:31 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-126,B,expert_53,,,Wed Jun 19 2024 19:40:54 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-126,B,expert_24,,,Tue May 14 2024 11:40:22 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-126,A,expert_24,,,Thu Jun 20 2024 05:13:34 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-127,B,expert_33,,,Wed Jan 17 2024 19:13:58 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-127,B,expert_33,,,Sat Jan 27 2024 23:07:31 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-127,B,expert_9,,,Sat Sep 07 2024 05:24:31 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-127,Tie,expert_9,,,Wed Jul 03 2024 22:15:00 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-127,A,expert_25,,,Sun May 12 2024 02:23:35 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-127,A,expert_25,,,Tue Feb 13 2024 10:55:12 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-127,Tie,author_2,,,Thu Nov 28 2024 18:53:34 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-127,Tie,author_2,,,Tue Dec 10 2024 06:51:10 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-127,A,expert_35,,,Tue Jun 18 2024 22:50:25 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-127,A,expert_35,,,Tue Dec 24 2024 19:38:21 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-127,A,expert_55,,,Sat Dec 14 2024 19:07:17 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-127,A,expert_55,,,Sat Mar 16 2024 06:15:46 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-127,A,expert_24,,,Mon Mar 11 2024 21:44:18 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-127,Tie,expert_24,,,Wed May 08 2024 22:00:39 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-127,Tie,expert_24,,,Mon Nov 25 2024 09:11:23 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-127,Tie,expert_24,,,Wed Oct 09 2024 00:57:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-127,A,expert_19,,,Fri Feb 02 2024 08:54:44 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-127,Tie,expert_19,,,Fri Aug 02 2024 02:13:25 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-127,A,expert_31,,,Mon Jul 15 2024 22:28:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-127,Tie,expert_31,,,Sat Jan 06 2024 18:20:22 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-127,A,expert_2,,,Tue Sep 24 2024 22:06:09 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-127,A,expert_2,,,Tue May 07 2024 11:53:58 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-127,A,expert_50,,,Mon Jan 22 2024 19:24:11 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-127,Tie,expert_50,,,Mon Nov 04 2024 13:54:02 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-127,B,author_0,,,Thu May 02 2024 04:51:29 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-127,Tie,author_0,,,Thu Mar 28 2024 18:28:26 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-127,A,expert_42,,,Wed Dec 11 2024 20:11:16 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-127,A,expert_42,,,Tue Mar 19 2024 14:11:03 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-127,A,expert_44,,,Sun Aug 11 2024 23:25:41 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-127,A,expert_44,,,Sat Sep 07 2024 04:11:59 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-127,A,expert_28,,,Mon Dec 16 2024 00:43:12 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-127,B,expert_28,,,Fri May 17 2024 00:38:36 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-127,B,expert_32,,,Fri Dec 13 2024 13:27:32 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-127,B,expert_32,,,Fri Nov 01 2024 20:31:12 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-127,B,expert_9,,,Thu Jan 04 2024 15:22:45 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-127,B,expert_9,,,Wed Jul 17 2024 21:53:17 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-127,B,expert_3,,,Sat May 04 2024 16:53:10 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-127,B,expert_3,,,Sat May 11 2024 15:50:50 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-127,B,expert_44,,,Fri Jan 19 2024 02:21:09 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-127,B,expert_44,,,Mon Jun 10 2024 19:22:34 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-127,B,author_0,,,Sat Aug 24 2024 19:44:58 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-127,Tie,author_0,,,Sun Jan 07 2024 19:02:12 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-127,A,expert_46,,,Mon Jul 01 2024 04:51:42 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-127,A,expert_46,,,Tue Sep 03 2024 09:50:10 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-128,B,expert_6,,,Wed Jul 03 2024 02:17:54 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-128,Tie,expert_6,,,Wed Sep 18 2024 10:02:37 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-128,Tie,author_0,,,Thu Jun 27 2024 15:01:07 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-128,Tie,expert_33,,,Mon Jul 15 2024 12:31:52 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-128,Tie,expert_33,,,Fri Feb 16 2024 18:59:19 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-128,Tie,author_0,,,Tue Dec 24 2024 18:44:43 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-128,B,author_0,,,Sat Sep 28 2024 03:16:56 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-128,A,expert_17,,,Thu Mar 07 2024 10:44:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-128,A,expert_17,,,Fri Oct 04 2024 19:00:24 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-128,A,expert_24,,,Mon Mar 11 2024 19:01:46 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-128,A,expert_24,,,Fri Dec 13 2024 12:54:18 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-128,A,author_3,,,Thu Feb 22 2024 19:59:34 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-128,A,author_3,,,Sun Mar 03 2024 21:52:10 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-128,Tie,expert_26,,,Fri Apr 05 2024 00:27:21 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-128,Tie,expert_26,,,Thu Nov 21 2024 01:57:03 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-128,A,expert_29,,,Fri May 24 2024 18:16:10 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-128,A,expert_29,,,Fri Oct 18 2024 02:29:29 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-128,A,expert_24,,,Mon Apr 01 2024 00:12:21 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-128,A,expert_24,,,Tue Sep 03 2024 05:07:44 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-128,A,expert_10,,,Tue Nov 19 2024 11:47:23 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-128,A,expert_10,,,Thu Dec 12 2024 19:02:06 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-128,A,expert_26,,,Wed Nov 13 2024 06:40:26 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-128,Tie,expert_26,,,Sat Jul 27 2024 04:51:45 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-128,A,expert_47,,,Sun Sep 01 2024 03:22:58 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-128,A,expert_47,,,Mon Jun 17 2024 16:43:46 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-128,Tie,author_6,,,Mon Jan 08 2024 07:35:42 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-128,Tie,author_6,,,Wed Apr 24 2024 14:33:05 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-128,Tie,expert_38,,,Sat Apr 27 2024 00:46:03 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-128,Tie,expert_38,,,Fri Sep 13 2024 14:42:36 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-128,Tie,expert_48,,,Tue Jul 02 2024 06:54:28 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-128,Tie,expert_48,,,Wed Feb 07 2024 18:15:34 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-128,B,expert_37,,,Fri May 17 2024 11:07:34 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-128,B,expert_37,,,Sat Apr 27 2024 07:34:15 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-128,B,expert_5,,,Mon Aug 12 2024 23:35:44 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-128,Tie,expert_5,,,Wed Mar 20 2024 18:56:01 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-128,B,expert_56,,,Mon Jul 01 2024 10:18:40 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-128,B,expert_56,,,Thu Feb 01 2024 08:10:09 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-128,Tie,author_6,,,Mon Apr 01 2024 02:47:16 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-128,Tie,author_6,,,Thu Dec 26 2024 07:12:33 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-128,B,author_6,,,Wed Feb 28 2024 01:56:07 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-128,B,author_6,,,Fri Feb 16 2024 17:40:08 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-128,B,expert_27,,,Tue May 07 2024 02:54:02 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-128,B,expert_27,,,Thu Sep 05 2024 18:39:15 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-129,Tie,expert_39,,,Fri Jul 19 2024 02:05:37 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-129,B,expert_39,,,Mon Oct 28 2024 14:59:09 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-129,Tie,author_2,,,Mon Feb 12 2024 08:42:50 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-129,Tie,author_2,,,Mon Jun 17 2024 22:46:41 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-129,A,author_2,,,Sun Feb 11 2024 03:46:03 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-129,A,author_2,,,Sun May 19 2024 12:26:52 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-129,A,expert_12,,,Wed Sep 04 2024 21:55:24 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-129,A,expert_12,,,Sat Nov 02 2024 22:59:57 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-129,A,author_4,,,Thu Jun 06 2024 20:11:53 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-129,A,author_4,,,Thu Aug 08 2024 00:23:38 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-129,A,expert_25,,,Sat Jan 06 2024 16:42:57 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-129,A,expert_25,,,Wed Jun 05 2024 19:09:47 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-129,A,expert_10,,,Fri Oct 18 2024 07:39:36 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-129,A,expert_10,,,Mon Dec 16 2024 23:05:42 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-129,A,expert_24,,,Mon Dec 23 2024 23:09:42 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-129,A,expert_24,,,Tue Aug 20 2024 03:24:13 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-129,B,expert_46,,,Tue Jan 16 2024 12:54:33 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-129,A,expert_46,,,Sat Sep 07 2024 02:57:19 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-129,A,expert_10,,,Fri Apr 26 2024 09:14:28 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-129,A,expert_10,,,Wed Nov 06 2024 09:34:52 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-129,B,expert_17,,,Fri Aug 16 2024 01:10:01 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-129,Tie,expert_17,,,Wed Dec 04 2024 12:45:21 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-129,B,expert_50,,,Fri Aug 02 2024 16:00:53 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-129,B,expert_50,,,Tue Aug 20 2024 18:51:55 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-129,B,expert_4,,,Sat May 18 2024 13:04:05 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-129,B,expert_4,,,Sun Mar 03 2024 07:16:23 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-129,B,expert_0,,,Sat Jan 27 2024 13:35:00 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-129,B,expert_0,,,Tue Dec 24 2024 21:33:58 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-129,B,expert_13,,,Mon Jan 08 2024 08:38:03 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-129,Tie,expert_13,,,Fri Aug 09 2024 18:45:34 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-129,A,expert_48,,,Sun Nov 24 2024 14:28:01 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-129,Tie,expert_48,,,Sat Jun 15 2024 22:22:18 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-129,B,expert_28,,,Sat Oct 05 2024 10:11:06 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-129,B,expert_28,,,Thu Apr 11 2024 06:27:58 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-129,B,expert_31,,,Sun Dec 22 2024 11:49:58 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-129,B,expert_31,,,Fri Sep 13 2024 20:47:12 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-130,A,expert_41,,,Sat Sep 28 2024 19:22:39 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-130,Tie,expert_41,,,Fri Jul 19 2024 05:58:44 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-130,B,author_0,,,Mon Sep 02 2024 01:42:07 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-130,B,author_0,,,Tue Sep 17 2024 02:29:29 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-130,A,expert_25,,,Mon May 13 2024 18:44:38 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-130,A,expert_25,,,Tue Oct 22 2024 03:31:06 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-130,A,expert_55,,,Tue Oct 08 2024 20:05:57 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-130,A,expert_55,,,Tue Dec 03 2024 16:42:46 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-130,A,expert_3,,,Sun Oct 06 2024 13:04:11 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-130,A,expert_3,,,Wed May 22 2024 15:51:08 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-130,A,expert_0,,,Mon Sep 23 2024 17:49:32 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-130,A,expert_0,,,Wed Apr 03 2024 16:54:25 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-130,A,expert_57,,,Sat Feb 10 2024 02:35:10 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-130,A,expert_57,,,Tue Feb 20 2024 02:26:39 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-130,B,expert_12,,,Tue Apr 02 2024 09:45:18 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-130,Tie,expert_12,,,Fri Mar 01 2024 13:08:44 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-130,A,author_1,,,Mon Apr 15 2024 22:16:06 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-130,A,author_1,,,Fri Nov 15 2024 04:45:06 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-130,A,expert_24,,,Sun Mar 17 2024 08:28:26 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-130,A,expert_24,,,Sun Jul 14 2024 01:04:26 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-130,B,expert_50,,,Tue Nov 05 2024 15:56:37 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-130,A,expert_50,,,Fri Sep 13 2024 14:07:13 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-130,Tie,expert_25,,,Fri Feb 09 2024 12:33:34 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-130,B,expert_25,,,Wed Feb 07 2024 01:19:17 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-130,Tie,expert_13,,,Mon May 06 2024 03:24:08 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-130,B,expert_13,,,Sun Oct 20 2024 21:55:18 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-130,B,author_0,,,Mon Oct 14 2024 15:10:36 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-130,B,author_0,,,Fri Aug 23 2024 11:19:05 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-130,Tie,expert_39,,,Fri Oct 04 2024 09:08:49 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-130,B,expert_39,,,Fri Apr 19 2024 22:05:52 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-130,Tie,author_6,,,Thu Jan 18 2024 04:04:29 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-130,B,author_6,,,Fri Aug 02 2024 07:03:50 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-130,A,expert_38,,,Fri Dec 13 2024 15:18:31 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-130,Tie,expert_38,,,Fri May 10 2024 05:10:49 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-130,A,expert_49,,,Mon Sep 23 2024 12:21:42 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-130,A,expert_49,,,Sat Jun 22 2024 16:31:48 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-130,A,expert_57,,,Sun Sep 22 2024 06:48:11 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-130,A,expert_57,,,Fri Apr 26 2024 18:17:02 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-131,Tie,expert_9,,,Sun Apr 14 2024 17:58:05 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-131,Tie,expert_9,,,Mon Oct 07 2024 06:18:59 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-131,Tie,expert_36,,,Tue Oct 15 2024 02:32:58 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-131,Tie,expert_36,,,Tue Dec 17 2024 01:31:58 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-131,A,expert_12,,,Fri May 10 2024 03:56:19 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-131,A,expert_12,,,Mon Jul 22 2024 21:59:27 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-131,A,expert_38,,,Fri Dec 27 2024 14:00:18 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-131,A,expert_38,,,Tue Dec 10 2024 06:46:45 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-131,Tie,expert_31,,,Fri Dec 06 2024 21:11:52 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-131,Tie,expert_31,,,Wed Aug 21 2024 01:48:36 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-131,A,author_0,,,Wed Aug 28 2024 23:02:36 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-131,A,author_0,,,Mon Sep 16 2024 13:43:31 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-131,A,expert_20,,,Sat Feb 24 2024 00:58:52 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-131,A,expert_20,,,Sat Apr 27 2024 11:03:59 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-131,A,expert_24,,,Wed Jul 10 2024 05:32:55 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-131,A,expert_24,,,Sun Jun 02 2024 00:19:56 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-131,A,expert_42,,,Sun Jan 28 2024 18:52:15 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-131,A,expert_42,,,Sun Sep 08 2024 22:40:04 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-131,Tie,expert_24,,,Wed May 22 2024 07:40:15 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-131,Tie,expert_24,,,Tue May 28 2024 00:20:31 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-131,B,expert_0,,,Wed Jul 03 2024 15:04:40 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-131,A,expert_0,,,Wed Jan 24 2024 17:28:04 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-131,A,expert_15,,,Wed Jan 03 2024 04:29:08 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-131,B,author_3,,,Sat Oct 05 2024 11:51:41 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-131,B,author_3,,,Sun Aug 25 2024 23:39:07 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-131,A,expert_26,,,Thu Jun 27 2024 15:27:14 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-131,B,expert_26,,,Sun Oct 27 2024 03:21:50 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-131,Tie,expert_3,,,Tue Jul 09 2024 20:23:07 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-131,Tie,expert_3,,,Fri May 10 2024 04:41:47 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-131,A,expert_51,,,Tue Oct 15 2024 01:54:10 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-131,A,expert_51,,,Thu Dec 19 2024 01:52:26 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-131,B,expert_14,,,Sun May 19 2024 20:15:01 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-131,B,expert_14,,,Wed Dec 04 2024 00:55:58 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-132,Tie,expert_34,,,Sat Sep 14 2024 06:04:17 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-132,Tie,expert_34,,,Thu Aug 08 2024 03:38:14 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-132,Tie,expert_47,,,Fri Jul 12 2024 17:21:30 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-132,Tie,expert_47,,,Sat Oct 05 2024 14:38:40 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-132,B,expert_42,,,Sat Aug 10 2024 04:42:58 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-132,A,expert_42,,,Fri Nov 22 2024 17:32:56 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-132,Tie,expert_46,,,Tue Jul 09 2024 21:08:46 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-132,A,expert_46,,,Thu Aug 01 2024 19:14:00 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-132,Tie,author_2,,,Fri Oct 04 2024 21:13:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-132,A,author_2,,,Tue Mar 12 2024 04:19:37 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-132,Tie,expert_24,,,Fri Jun 14 2024 02:52:39 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-132,B,expert_24,,,Sat Mar 16 2024 22:38:35 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-132,Tie,expert_49,,,Sun Dec 01 2024 23:28:27 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-132,B,expert_49,,,Fri Jan 26 2024 09:59:33 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-132,A,expert_3,,,Mon Nov 11 2024 17:13:52 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-132,B,expert_3,,,Sat Oct 12 2024 03:02:58 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-132,B,author_3,,,Fri Jan 19 2024 23:54:55 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-132,B,author_3,,,Sun Jan 14 2024 13:03:40 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-132,B,author_4,,,Sat May 25 2024 02:13:42 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-132,B,author_4,,,Sun May 19 2024 06:33:03 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-132,B,author_2,,,Fri Dec 13 2024 02:24:35 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-132,A,author_2,,,Sun Jan 28 2024 13:12:02 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-132,B,expert_10,,,Sat Jun 15 2024 20:13:23 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-132,B,expert_10,,,Fri Sep 20 2024 21:36:11 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-132,Tie,expert_2,,,Tue Jun 18 2024 10:32:09 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-132,B,expert_2,,,Sun Nov 03 2024 13:44:21 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-132,Tie,expert_6,,,Sun Apr 21 2024 14:33:15 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-132,B,expert_6,,,Thu Aug 01 2024 14:32:53 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-133,B,expert_27,,,Fri May 17 2024 21:23:54 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-133,B,expert_27,,,Thu Apr 04 2024 14:16:08 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-133,Tie,expert_49,,,Fri Dec 20 2024 07:29:03 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-133,B,expert_49,,,Sat Jul 27 2024 15:39:23 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-133,A,expert_7,,,Mon Oct 14 2024 00:59:46 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-133,A,expert_7,,,Tue Jun 18 2024 06:52:03 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-133,B,expert_7,,,Sat May 04 2024 07:36:06 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-133,B,expert_7,,,Wed Aug 28 2024 11:32:52 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-133,B,expert_9,,,Sat Sep 28 2024 20:56:43 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-133,Tie,expert_9,,,Fri Oct 25 2024 10:11:59 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-133,Tie,expert_12,,,Fri Jan 19 2024 00:15:07 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-133,A,expert_12,,,Sat Jun 01 2024 23:21:38 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-133,Tie,expert_54,,,Tue Sep 24 2024 05:45:58 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-133,Tie,expert_54,,,Fri Jun 14 2024 00:44:42 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-133,Tie,expert_45,,,Fri Jul 05 2024 05:28:16 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-133,B,expert_45,,,Thu Apr 25 2024 12:01:42 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-133,A,expert_35,,,Sun Nov 24 2024 10:14:30 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-133,A,expert_35,,,Wed Oct 02 2024 07:08:14 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-133,A,expert_23,,,Sat Apr 20 2024 03:09:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-133,B,expert_23,,,Mon Jun 24 2024 09:26:31 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-133,A,expert_8,,,Fri Jul 12 2024 23:55:42 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-133,A,expert_8,,,Wed Dec 11 2024 08:58:36 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-133,A,expert_12,,,Thu Nov 28 2024 18:40:08 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-133,Tie,expert_12,,,Thu Jan 04 2024 13:19:11 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-133,A,expert_24,,,Sun Sep 15 2024 12:49:05 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-133,A,expert_24,,,Wed Feb 07 2024 05:23:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-133,Tie,author_0,,,Fri Apr 19 2024 19:33:34 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-133,A,author_0,,,Mon Jul 15 2024 04:17:21 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-133,B,expert_28,,,Fri Aug 16 2024 14:56:53 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-133,A,expert_28,,,Mon Dec 16 2024 02:56:18 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-133,Tie,expert_15,,,Tue Sep 17 2024 14:56:21 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-133,A,expert_15,,,Wed Nov 27 2024 03:01:42 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-133,A,expert_8,,,Sat Dec 07 2024 22:46:10 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-133,A,expert_8,,,Tue Dec 17 2024 11:08:27 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-133,Tie,expert_26,,,Wed Oct 02 2024 16:26:46 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-133,B,expert_26,,,Mon May 20 2024 02:07:52 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-133,Tie,expert_29,,,Wed Apr 03 2024 23:06:55 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-133,B,expert_29,,,Mon Oct 14 2024 00:06:32 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-133,Tie,author_4,,,Mon Feb 12 2024 11:07:55 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-133,Tie,author_4,,,Fri Jan 26 2024 10:15:44 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-133,B,expert_2,,,Sun May 19 2024 09:40:43 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-133,B,expert_2,,,Sat Jul 27 2024 06:25:15 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-133,B,expert_29,,,Sat Aug 24 2024 09:57:22 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-133,B,expert_29,,,Mon Nov 25 2024 04:44:44 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-133,B,author_4,,,Thu Jun 27 2024 08:58:26 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-133,B,author_4,,,Sat Jan 20 2024 17:18:34 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-133,B,expert_26,,,Mon May 20 2024 00:38:46 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-133,B,expert_26,,,Thu Jan 04 2024 08:35:51 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-133,B,expert_15,,,Tue Dec 03 2024 00:07:56 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-133,B,expert_15,,,Mon Jul 01 2024 03:06:11 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-133,A,author_2,,,Tue Aug 20 2024 18:52:30 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-133,A,author_2,,,Sun Apr 07 2024 13:03:57 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-133,B,author_4,,,Mon Oct 28 2024 16:28:09 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-133,B,author_4,,,Fri Sep 20 2024 00:18:21 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-133,B,expert_40,,,Sat Aug 24 2024 02:13:09 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-133,B,expert_40,,,Wed Jul 17 2024 14:50:44 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-134,B,author_3,,,Sat Jun 15 2024 06:19:11 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-134,B,author_3,,,Thu Apr 25 2024 14:34:17 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-134,Tie,author_0,,,Sat Sep 28 2024 03:04:01 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-134,B,author_0,,,Wed Mar 20 2024 23:26:22 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-134,Tie,expert_0,,,Tue Feb 06 2024 17:40:10 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-134,B,expert_0,,,Sun Aug 11 2024 09:44:10 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-134,Tie,expert_10,,,Sat Jul 20 2024 15:05:53 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-134,Tie,expert_10,,,Sat Apr 06 2024 15:12:16 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-134,A,expert_49,,,Sat Jan 06 2024 16:29:49 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-134,A,expert_49,,,Wed Jun 19 2024 01:41:42 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-134,A,expert_11,,,Fri Jun 14 2024 10:15:14 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-134,A,expert_11,,,Sat Dec 28 2024 23:53:55 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-134,Tie,author_4,,,Wed Sep 25 2024 05:30:59 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-134,A,author_4,,,Tue Apr 23 2024 08:26:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-134,B,author_0,,,Sun Mar 03 2024 05:12:58 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-134,Tie,author_0,,,Wed May 08 2024 17:44:45 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-134,B,expert_11,,,Thu Sep 05 2024 02:04:57 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-134,Tie,expert_11,,,Thu Jun 27 2024 05:55:08 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-134,B,expert_29,,,Thu Nov 21 2024 13:16:17 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-134,A,expert_29,,,Tue Mar 26 2024 10:08:10 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-134,Tie,author_4,,,Wed Jan 24 2024 13:13:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-134,A,author_4,,,Thu Mar 07 2024 04:55:00 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-134,Tie,expert_48,,,Sat Mar 02 2024 11:58:17 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-134,B,expert_42,,,Sun Jan 28 2024 10:15:15 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-134,A,expert_42,,,Sat Jun 01 2024 16:58:37 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-134,A,author_5,,,Fri Nov 08 2024 21:18:14 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-134,A,author_5,,,Sun May 05 2024 19:53:10 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-134,Tie,author_3,,,Fri Jan 05 2024 10:30:22 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-134,Tie,author_3,,,Wed Feb 28 2024 13:55:47 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-134,A,expert_42,,,Sat Nov 02 2024 11:56:05 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-134,Tie,expert_42,,,Mon May 20 2024 07:50:32 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-134,A,expert_3,,,Tue Aug 13 2024 11:47:19 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-134,A,expert_3,,,Sat Nov 02 2024 12:54:54 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-134,A,expert_42,,,Tue Feb 27 2024 11:49:33 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-134,A,expert_42,,,Fri Aug 09 2024 00:36:21 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-134,A,expert_6,,,Mon Aug 12 2024 04:25:46 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-134,A,expert_6,,,Sat Jun 01 2024 19:33:47 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-134,A,expert_45,,,Mon Mar 11 2024 17:04:02 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-134,A,expert_45,,,Mon Mar 18 2024 11:32:34 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-134,B,expert_27,,,Fri Jul 19 2024 08:05:30 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-134,B,expert_27,,,Thu Apr 25 2024 11:54:26 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-134,Tie,author_3,,,Thu Mar 07 2024 17:19:43 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-134,B,author_3,,,Sat Oct 12 2024 02:37:34 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-134,A,expert_51,,,Tue Sep 10 2024 08:36:55 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-134,B,expert_51,,,Wed Jan 24 2024 15:10:25 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-134,A,expert_17,,,Thu Aug 22 2024 08:19:39 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-134,A,expert_17,,,Sat Oct 19 2024 08:43:15 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-134,A,expert_17,,,Sun Feb 11 2024 11:03:46 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-134,B,expert_17,,,Tue Jan 23 2024 23:49:11 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-134,A,author_5,,,Mon Jul 08 2024 14:26:04 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-134,Tie,author_5,,,Wed Jun 19 2024 02:18:35 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-135,B,author_4,,,Wed Dec 18 2024 19:57:49 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-135,B,author_4,,,Thu Mar 07 2024 13:54:52 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-135,B,expert_37,,,Fri Apr 19 2024 10:50:01 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-135,B,expert_37,,,Wed Jan 10 2024 18:45:21 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-135,A,expert_0,,,Fri Nov 08 2024 06:09:58 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-135,A,expert_0,,,Sat Sep 14 2024 20:53:26 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-135,Tie,expert_9,,,Wed Feb 21 2024 10:34:20 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-135,B,expert_9,,,Thu Jul 11 2024 17:24:37 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-135,A,expert_50,,,Mon Oct 28 2024 17:34:30 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-135,A,expert_50,,,Tue Jun 25 2024 20:56:09 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-135,Tie,expert_2,,,Mon Feb 19 2024 01:53:40 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-135,A,expert_2,,,Tue Apr 09 2024 01:35:16 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-135,A,expert_24,,,Mon Jun 24 2024 16:53:54 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-135,A,expert_24,,,Sat Feb 03 2024 08:26:20 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-135,A,expert_24,,,Mon Dec 23 2024 16:29:01 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-135,A,expert_24,,,Sun Aug 04 2024 12:53:38 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-135,B,expert_24,,,Thu Feb 15 2024 12:53:32 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-135,A,expert_24,,,Sun Feb 04 2024 11:16:21 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-135,A,expert_35,,,Tue Apr 09 2024 14:04:11 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-135,A,expert_35,,,Mon Apr 22 2024 01:29:43 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-135,Tie,author_4,,,Sun Feb 25 2024 17:19:31 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-135,B,author_4,,,Thu May 09 2024 21:19:41 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-135,B,expert_28,,,Fri Nov 08 2024 18:35:46 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-135,B,expert_28,,,Sat Mar 09 2024 21:15:08 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-135,A,expert_23,,,Mon Oct 28 2024 11:03:55 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-135,B,expert_23,,,Mon Jul 15 2024 03:39:07 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-135,Tie,expert_48,,,Sat Dec 07 2024 04:21:36 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-135,B,expert_48,,,Sat Mar 09 2024 12:30:02 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-135,A,author_2,,,Wed Aug 21 2024 11:34:09 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-135,Tie,author_2,,,Thu Mar 28 2024 01:53:07 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-136,B,expert_16,,,Wed Sep 18 2024 04:25:56 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-136,B,expert_16,,,Fri Aug 23 2024 05:31:39 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-136,B,expert_15,,,Fri May 24 2024 21:39:49 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-136,B,expert_15,,,Thu Apr 18 2024 04:19:55 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-136,Tie,expert_22,,,Fri May 24 2024 02:35:25 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-136,Tie,expert_22,,,Fri Jul 05 2024 05:03:00 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-136,A,expert_0,,,Sun Jan 14 2024 05:03:00 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-136,A,expert_0,,,Sat May 18 2024 22:38:32 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-136,Tie,expert_0,,,Thu Jul 25 2024 17:22:59 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-136,A,expert_0,,,Fri Sep 13 2024 18:35:58 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-136,Tie,author_0,,,Fri Mar 08 2024 14:35:26 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-136,Tie,author_0,,,Sun Feb 11 2024 23:41:17 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-136,A,expert_3,,,Mon Dec 02 2024 08:08:41 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-136,Tie,expert_3,,,Sat Jun 15 2024 21:52:51 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-136,A,expert_36,,,Mon Oct 14 2024 10:16:00 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-136,Tie,expert_36,,,Tue Jun 25 2024 04:01:21 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-136,Tie,expert_11,,,Thu Jun 20 2024 01:29:04 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-136,A,expert_11,,,Fri Jan 05 2024 04:57:29 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-136,Tie,expert_25,,,Sat Feb 03 2024 18:04:25 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-136,Tie,expert_25,,,Tue Mar 19 2024 20:44:13 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-136,Tie,expert_5,,,Thu Feb 08 2024 06:55:20 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-136,Tie,expert_5,,,Sun Aug 04 2024 20:36:02 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-136,A,expert_29,,,Thu May 09 2024 16:32:26 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-136,B,expert_29,,,Sat Nov 09 2024 10:31:08 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-136,A,author_4,,,Wed Apr 10 2024 06:00:25 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-136,Tie,author_4,,,Sat Feb 10 2024 17:13:56 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-136,A,expert_55,,,Mon Apr 22 2024 11:24:39 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-136,A,expert_55,,,Wed Aug 28 2024 10:42:48 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-136,Tie,expert_45,,,Thu Jan 25 2024 21:10:34 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-136,A,expert_45,,,Wed Dec 04 2024 03:25:21 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-136,B,expert_50,,,Mon Apr 08 2024 21:20:56 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-136,B,expert_50,,,Thu Jun 06 2024 10:19:29 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-136,A,expert_10,,,Mon Aug 05 2024 18:00:17 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-136,Tie,expert_10,,,Sun Nov 24 2024 04:03:23 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-136,Tie,expert_47,,,Wed Nov 20 2024 09:41:53 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-136,Tie,expert_47,,,Sat Oct 26 2024 11:09:29 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-136,B,expert_27,,,Wed Nov 20 2024 04:12:52 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-136,Tie,expert_27,,,Sun Jul 14 2024 00:58:46 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-136,B,expert_7,,,Sat Apr 27 2024 03:30:00 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-136,B,expert_7,,,Mon Dec 23 2024 03:51:41 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-136,A,expert_0,,,Wed May 15 2024 18:45:38 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-136,A,expert_0,,,Sun May 05 2024 00:34:50 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-137,B,expert_53,,,Thu Jun 27 2024 04:48:11 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-137,B,expert_53,,,Fri Aug 09 2024 17:33:08 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-137,B,author_0,,,Fri Apr 26 2024 20:53:37 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-137,B,author_0,,,Sun Oct 06 2024 07:06:37 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-137,B,expert_22,,,Sun Jan 21 2024 20:14:14 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-137,B,expert_22,,,Fri Mar 01 2024 00:49:48 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-137,Tie,expert_2,,,Thu Mar 21 2024 05:26:24 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-137,B,expert_2,,,Tue Jun 18 2024 05:06:05 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-137,B,expert_50,,,Fri Mar 15 2024 15:27:45 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-137,B,expert_50,,,Mon Feb 05 2024 19:36:45 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-137,A,author_4,,,Thu Jan 11 2024 05:22:45 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-137,A,author_4,,,Thu Mar 28 2024 23:32:56 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-137,B,expert_22,,,Mon Jul 01 2024 16:06:36 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-137,A,expert_22,,,Fri Sep 06 2024 12:15:31 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-137,A,expert_22,,,Sat Jun 01 2024 11:29:35 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-137,Tie,expert_39,,,Wed Jan 24 2024 14:44:44 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-137,A,expert_39,,,Thu Aug 15 2024 23:41:32 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-137,A,expert_24,,,Tue Jul 02 2024 20:45:30 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-137,Tie,expert_24,,,Wed Sep 25 2024 08:35:18 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-137,Tie,expert_37,,,Wed Nov 20 2024 21:01:35 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-137,A,expert_37,,,Thu Dec 26 2024 09:38:19 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-137,A,author_2,,,Thu Nov 28 2024 06:24:04 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-137,A,author_2,,,Fri Dec 13 2024 05:08:43 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-137,A,expert_19,,,Sun Jan 21 2024 22:19:13 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-137,A,expert_19,,,Wed Aug 21 2024 09:22:06 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-137,A,expert_2,,,Fri Mar 15 2024 21:00:47 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-137,A,expert_2,,,Sun Jun 16 2024 13:20:50 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-137,B,expert_24,,,Fri Feb 09 2024 17:47:31 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-137,B,expert_24,,,Sun Sep 08 2024 00:25:12 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-137,B,expert_4,,,Tue Jun 11 2024 03:16:37 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-137,B,expert_4,,,Sun Apr 21 2024 20:23:21 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-137,A,author_2,,,Thu Mar 21 2024 09:11:38 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-137,Tie,author_2,,,Wed May 08 2024 04:24:43 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-137,A,author_5,,,Thu Jul 25 2024 19:08:36 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-137,Tie,author_5,,,Thu Dec 26 2024 08:10:23 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-137,Tie,expert_24,,,Wed Jun 05 2024 22:05:24 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-137,B,expert_24,,,Sat Oct 19 2024 12:30:16 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-137,B,expert_41,,,Sun Apr 28 2024 15:53:07 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-137,B,expert_41,,,Sat Feb 10 2024 23:50:25 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-137,B,expert_9,,,Fri Feb 23 2024 16:54:10 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-137,B,expert_9,,,Wed Apr 10 2024 15:36:35 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-137,B,author_3,,,Sun Jul 21 2024 08:21:25 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-137,B,author_3,,,Sun Oct 20 2024 01:29:51 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-137,A,author_6,,,Tue Mar 26 2024 07:53:30 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-137,Tie,author_6,,,Sat Jul 20 2024 12:02:47 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-138,B,expert_44,,,Thu Sep 12 2024 06:25:00 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-138,B,expert_44,,,Wed Aug 07 2024 22:15:44 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-138,B,author_4,,,Sat Nov 02 2024 09:49:11 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-138,B,author_4,,,Tue Feb 13 2024 21:22:48 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-138,A,expert_3,,,Tue Oct 22 2024 19:09:02 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-138,Tie,expert_3,,,Fri Jun 07 2024 22:39:50 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-138,A,expert_56,,,Wed Jun 26 2024 00:07:52 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-138,A,expert_56,,,Wed May 15 2024 19:35:54 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-138,A,author_0,,,Fri Oct 11 2024 08:56:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-138,Tie,author_0,,,Tue Mar 26 2024 00:00:20 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-138,Tie,author_0,,,Mon Aug 12 2024 03:05:23 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-138,Tie,author_0,,,Fri Oct 18 2024 17:19:24 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-138,A,expert_24,,,Fri Jan 05 2024 08:30:51 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-138,A,expert_24,,,Sun Feb 11 2024 22:15:25 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-138,A,author_0,,,Fri May 03 2024 03:57:57 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-138,A,author_0,,,Wed May 15 2024 04:03:51 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-138,A,author_3,,,Mon Jun 03 2024 03:42:54 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-138,A,author_3,,,Fri Sep 06 2024 16:32:11 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-138,B,expert_6,,,Sat Oct 12 2024 06:08:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-138,Tie,expert_6,,,Sat May 25 2024 13:29:32 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-138,A,expert_1,,,Tue Sep 24 2024 17:49:28 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-138,A,expert_1,,,Sat Dec 14 2024 07:37:09 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-138,B,author_4,,,Fri Mar 22 2024 06:34:25 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-138,B,author_4,,,Sun Feb 18 2024 03:03:01 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-138,Tie,expert_24,,,Wed Aug 28 2024 23:57:40 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-138,A,expert_24,,,Thu Feb 08 2024 01:13:13 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-138,B,expert_22,,,Fri Aug 09 2024 16:12:31 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-138,A,expert_22,,,Fri Jun 07 2024 05:20:55 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-138,A,expert_51,,,Thu Sep 12 2024 06:29:15 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-138,A,expert_51,,,Sun Nov 24 2024 08:29:53 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-138,B,author_4,,,Mon Feb 19 2024 01:01:02 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-138,B,author_4,,,Tue Apr 02 2024 10:36:13 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-138,A,expert_42,,,Fri Oct 04 2024 01:12:53 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-138,B,expert_42,,,Mon Oct 28 2024 14:19:21 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-139,B,expert_46,,,Mon Apr 22 2024 13:41:17 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-139,A,expert_46,,,Mon Jan 22 2024 21:28:26 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-139,A,expert_12,,,Sat Jan 06 2024 03:39:49 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-139,A,expert_12,,,Thu Jul 18 2024 17:54:08 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-139,A,expert_15,,,Sun Sep 15 2024 09:45:14 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-139,A,expert_15,,,Thu Dec 19 2024 09:55:16 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-139,A,expert_8,,,Fri Oct 25 2024 07:06:26 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-139,A,expert_8,,,Wed Nov 20 2024 04:21:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-139,A,expert_32,,,Wed Mar 13 2024 15:42:05 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-139,Tie,expert_32,,,Fri Jun 28 2024 21:35:20 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-139,A,expert_39,,,Thu Feb 22 2024 22:54:49 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-139,A,expert_46,,,Fri Jan 19 2024 12:23:02 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-139,A,expert_46,,,Mon Jan 22 2024 19:47:00 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-139,A,expert_0,,,Sat May 18 2024 18:56:24 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-139,A,expert_0,,,Tue May 07 2024 09:24:26 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-139,A,expert_6,,,Fri Nov 15 2024 23:48:36 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-139,A,expert_6,,,Sun Aug 25 2024 13:48:25 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-139,A,expert_26,,,Tue Dec 24 2024 12:33:29 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-139,A,expert_26,,,Thu Aug 22 2024 15:05:51 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-139,A,expert_25,,,Tue Jan 23 2024 00:57:02 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-139,A,expert_25,,,Tue Feb 06 2024 13:59:58 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-139,B,author_2,,,Sat Apr 13 2024 17:59:57 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-139,Tie,author_2,,,Fri Jul 05 2024 11:14:22 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-139,B,expert_15,,,Mon May 27 2024 23:34:40 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-139,B,expert_15,,,Sat Oct 19 2024 04:16:36 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-139,Tie,expert_34,,,Thu Jul 11 2024 06:47:43 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-139,Tie,expert_34,,,Sat Jul 20 2024 19:26:37 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-139,Tie,author_2,,,Mon Nov 25 2024 10:16:31 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-139,B,author_2,,,Thu Jun 13 2024 18:48:34 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-139,B,expert_20,,,Mon May 06 2024 17:35:44 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-139,B,expert_20,,,Sun Jan 07 2024 01:00:35 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-139,B,expert_53,,,Sun Aug 18 2024 16:05:44 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-139,B,expert_53,,,Mon Jan 01 2024 08:13:35 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-139,B,author_5,,,Tue Sep 24 2024 05:57:08 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-139,B,author_5,,,Sun Feb 18 2024 23:43:17 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-140,B,author_0,,,Mon Sep 09 2024 00:36:19 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-140,B,author_0,,,Sun Nov 24 2024 09:33:17 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-140,A,expert_35,,,Thu May 16 2024 03:20:02 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-140,Tie,expert_35,,,Sat Nov 02 2024 14:12:28 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-140,B,expert_41,,,Thu Dec 05 2024 04:04:38 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-140,B,expert_41,,,Mon Dec 02 2024 07:49:26 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-140,A,expert_32,,,Tue Mar 26 2024 18:59:18 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-140,B,expert_32,,,Wed Aug 21 2024 03:05:50 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-140,Tie,expert_18,,,Tue Jun 18 2024 08:11:43 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-140,B,expert_18,,,Sun Mar 17 2024 13:54:36 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-140,A,expert_44,,,Mon Jul 15 2024 12:53:08 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-140,A,expert_44,,,Fri Sep 13 2024 14:09:27 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-140,A,expert_25,,,Tue Mar 05 2024 03:24:59 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-140,A,expert_25,,,Mon Feb 26 2024 01:21:52 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-140,A,expert_44,,,Sat Oct 26 2024 16:49:03 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-140,A,expert_44,,,Tue Jul 16 2024 21:09:36 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-140,B,expert_38,,,Sat Dec 28 2024 15:28:35 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-140,B,expert_38,,,Fri Nov 08 2024 15:49:47 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-140,A,author_4,,,Sat Apr 20 2024 16:10:08 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-140,A,author_4,,,Fri Sep 13 2024 13:59:10 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-140,Tie,expert_43,,,Wed Mar 06 2024 20:57:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-140,A,expert_43,,,Mon May 13 2024 11:43:20 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-140,Tie,expert_20,,,Thu Oct 03 2024 20:49:36 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-140,Tie,expert_20,,,Tue May 28 2024 16:11:44 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-140,Tie,expert_12,,,Thu Nov 07 2024 20:03:00 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-140,Tie,expert_12,,,Sun Jul 07 2024 12:52:23 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-140,A,expert_34,,,Thu Oct 17 2024 16:30:17 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-140,Tie,expert_34,,,Sat May 11 2024 16:56:04 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-140,A,author_0,,,Tue Aug 13 2024 05:36:03 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-140,A,author_0,,,Sun Sep 22 2024 02:45:16 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-140,B,author_0,,,Thu Sep 05 2024 14:34:29 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-140,B,author_0,,,Thu Sep 05 2024 03:05:12 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-140,B,expert_26,,,Tue Oct 15 2024 04:09:06 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-140,B,expert_26,,,Tue Oct 01 2024 15:25:45 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-140,B,expert_28,,,Thu Sep 05 2024 11:36:28 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-140,B,expert_28,,,Mon Feb 26 2024 11:43:06 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-140,B,expert_31,,,Mon Sep 02 2024 13:44:13 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-140,B,expert_31,,,Mon Oct 28 2024 22:23:44 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-140,B,expert_11,,,Sat Jul 27 2024 17:13:59 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-140,B,expert_11,,,Wed Jul 10 2024 11:28:12 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-140,Tie,expert_19,,,Tue Oct 15 2024 06:44:18 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-140,B,expert_19,,,Fri Oct 25 2024 03:27:40 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-140,B,expert_21,,,Wed Aug 28 2024 12:50:07 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-140,B,expert_21,,,Fri Nov 08 2024 22:43:06 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-140,B,expert_4,,,Sun Jan 07 2024 09:36:57 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-140,B,expert_4,,,Sat Aug 17 2024 06:17:11 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-140,A,expert_42,,,Thu Jul 04 2024 20:12:30 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-140,A,expert_42,,,Tue Mar 12 2024 04:02:06 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-141,A,expert_26,,,Tue Feb 06 2024 19:16:49 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-141,A,expert_26,,,Sun Jun 23 2024 15:43:04 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-141,A,expert_55,,,Tue Mar 12 2024 07:57:10 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-141,A,expert_55,,,Wed Feb 28 2024 05:51:41 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-141,Tie,expert_31,,,Sat Mar 23 2024 03:41:53 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-141,B,expert_31,,,Thu Jan 04 2024 22:31:27 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-141,A,expert_31,,,Mon Aug 26 2024 17:29:01 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-141,A,expert_31,,,Mon Sep 16 2024 21:12:10 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-141,Tie,expert_9,,,Sun Oct 27 2024 19:13:39 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-141,A,expert_9,,,Sun Nov 17 2024 21:02:14 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-141,A,author_4,,,Wed Nov 27 2024 01:30:02 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-141,A,author_4,,,Wed Mar 27 2024 00:59:47 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-141,Tie,author_4,,,Mon Apr 08 2024 23:45:35 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-141,B,author_4,,,Mon Jul 22 2024 02:36:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-141,B,expert_29,,,Mon Nov 25 2024 19:06:08 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-141,B,expert_29,,,Thu Jun 20 2024 05:38:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-141,A,expert_53,,,Mon Nov 18 2024 22:16:31 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-141,Tie,expert_53,,,Tue Apr 16 2024 03:08:03 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-141,Tie,author_4,,,Mon May 27 2024 22:58:38 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-141,Tie,author_4,,,Fri Jun 21 2024 09:18:05 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-141,A,expert_4,,,Sat May 25 2024 12:59:52 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-141,A,expert_4,,,Fri Feb 02 2024 16:06:17 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-141,Tie,expert_18,,,Tue Apr 16 2024 06:39:29 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-141,A,expert_18,,,Sat Feb 03 2024 11:16:51 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-141,B,expert_20,,,Mon Jun 10 2024 05:42:34 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-141,A,expert_20,,,Mon Apr 08 2024 18:07:41 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-141,A,expert_5,,,Sun Dec 08 2024 08:52:21 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-141,A,expert_5,,,Thu Aug 08 2024 14:55:54 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-141,B,author_0,,,Sun Dec 15 2024 01:27:30 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-141,B,author_0,,,Wed Feb 21 2024 03:39:18 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-141,B,expert_24,,,Fri Jun 07 2024 02:51:26 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-141,B,expert_24,,,Thu Aug 08 2024 08:07:14 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-141,B,author_3,,,Tue Dec 24 2024 17:50:09 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-141,B,author_3,,,Wed Apr 24 2024 22:01:31 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-141,B,expert_20,,,Fri Mar 22 2024 05:24:57 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-141,B,expert_20,,,Tue May 14 2024 18:11:25 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-142,Tie,expert_0,,,Sat May 11 2024 21:12:10 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-142,B,expert_0,,,Tue Sep 03 2024 03:10:00 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-142,A,expert_20,,,Mon Oct 14 2024 03:59:38 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-142,B,expert_20,,,Sat Mar 23 2024 18:21:02 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-142,B,author_0,,,Tue Jul 09 2024 08:50:31 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-142,B,author_0,,,Wed Mar 06 2024 19:53:35 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-142,B,expert_25,,,Thu Jul 18 2024 02:58:18 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-142,A,expert_25,,,Mon May 13 2024 15:58:21 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-142,Tie,author_4,,,Tue Dec 10 2024 08:23:33 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-142,A,author_4,,,Wed Feb 28 2024 11:49:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-142,A,expert_25,,,Sun Feb 25 2024 07:51:36 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-142,B,expert_25,,,Tue Dec 10 2024 19:48:25 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-142,B,expert_8,,,Mon Feb 26 2024 21:37:50 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-142,B,expert_8,,,Tue Nov 19 2024 17:11:08 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-142,B,author_4,,,Sun Aug 04 2024 19:31:14 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-142,B,author_4,,,Mon Aug 26 2024 23:16:01 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-142,Tie,expert_48,,,Sun Dec 08 2024 05:27:56 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-142,B,expert_48,,,Tue Oct 15 2024 12:04:34 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-142,B,expert_7,,,Sat Jun 22 2024 03:54:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-142,B,expert_7,,,Mon Aug 05 2024 14:01:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-142,A,author_0,,,Tue May 14 2024 06:16:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-142,A,author_0,,,Fri Nov 01 2024 07:17:24 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-142,B,expert_15,,,Mon Jun 03 2024 07:32:55 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-142,A,expert_15,,,Sat Oct 26 2024 04:22:47 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-142,A,expert_16,,,Wed Feb 21 2024 03:58:54 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-142,A,expert_16,,,Wed Mar 20 2024 08:11:24 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-142,A,expert_39,,,Sun Nov 24 2024 23:29:46 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-142,A,expert_39,,,Sun Oct 13 2024 03:56:38 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-142,A,author_2,,,Thu Nov 21 2024 17:03:22 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-142,A,author_2,,,Mon Mar 18 2024 01:35:07 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-142,B,expert_0,,,Tue Jun 18 2024 02:21:11 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-142,A,expert_15,,,Fri Oct 04 2024 06:24:26 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-142,A,expert_15,,,Sun Aug 25 2024 09:54:12 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-142,A,expert_14,,,Mon Jun 17 2024 09:51:27 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-142,A,expert_14,,,Mon Jul 08 2024 13:29:06 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-142,A,expert_41,,,Mon Oct 21 2024 16:45:25 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-142,Tie,expert_41,,,Thu Feb 08 2024 10:03:41 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-142,B,expert_12,,,Wed May 01 2024 20:34:35 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-142,Tie,expert_12,,,Sun Jan 21 2024 08:29:43 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-142,B,expert_41,,,Tue May 14 2024 17:41:52 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-142,B,expert_41,,,Tue Aug 13 2024 17:56:38 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-142,B,expert_51,,,Sun Dec 08 2024 15:56:10 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-142,B,expert_51,,,Sun Feb 18 2024 11:20:19 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-142,B,expert_39,,,Sun Aug 25 2024 05:31:46 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-142,B,expert_39,,,Thu Feb 01 2024 19:45:50 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-142,B,expert_44,,,Sun Jan 21 2024 21:49:40 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-142,B,expert_44,,,Fri Apr 12 2024 14:23:39 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-142,A,author_5,,,Tue Oct 15 2024 01:03:57 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-142,A,author_5,,,Mon Feb 12 2024 03:57:52 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-142,B,expert_4,,,Thu Jul 25 2024 00:34:12 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-142,B,expert_4,,,Fri Dec 27 2024 21:25:49 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-142,A,expert_39,,,Mon Nov 11 2024 15:15:25 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-142,A,expert_39,,,Fri Sep 27 2024 08:18:23 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-143,B,expert_17,,,Sat Nov 23 2024 18:55:57 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-143,B,expert_17,,,Thu Nov 14 2024 04:28:14 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-143,A,author_3,,,Sun Aug 11 2024 11:53:45 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-143,B,author_3,,,Mon Jun 24 2024 15:47:24 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-143,B,expert_38,,,Thu Aug 01 2024 19:52:10 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-143,B,expert_38,,,Sat Jan 20 2024 12:03:38 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-143,A,expert_56,,,Thu Jul 04 2024 03:39:30 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-143,B,expert_56,,,Fri Oct 25 2024 12:53:47 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-143,A,expert_55,,,Wed Sep 25 2024 21:09:49 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-143,A,expert_55,,,Sun Jan 21 2024 23:18:24 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-143,B,expert_36,,,Thu Sep 19 2024 13:06:24 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-143,A,expert_24,,,Fri Oct 04 2024 08:00:07 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-143,A,expert_24,,,Wed Sep 04 2024 04:38:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-143,B,author_4,,,Sat Jun 15 2024 16:54:58 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-143,B,author_4,,,Sat Nov 23 2024 00:29:52 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-143,Tie,author_0,,,Mon Jul 15 2024 21:33:29 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-143,A,expert_47,,,Tue Aug 13 2024 23:57:36 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-143,Tie,expert_47,,,Sun Jan 21 2024 07:55:47 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-143,A,expert_11,,,Fri Apr 05 2024 13:31:29 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-143,A,expert_11,,,Tue Feb 20 2024 10:38:23 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-143,A,expert_55,,,Sat Jul 20 2024 13:53:07 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-143,A,expert_55,,,Tue Mar 26 2024 03:30:51 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-143,B,expert_0,,,Tue Feb 27 2024 01:44:37 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-143,B,expert_0,,,Tue Mar 26 2024 14:06:51 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-143,B,expert_9,,,Mon Dec 23 2024 09:17:11 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-143,B,expert_9,,,Sun May 19 2024 11:58:06 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-143,A,expert_11,,,Thu Mar 28 2024 00:39:10 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-143,Tie,expert_11,,,Sat Jul 20 2024 09:28:35 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-143,B,expert_25,,,Tue Nov 12 2024 03:09:19 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-143,B,expert_25,,,Fri Dec 27 2024 22:41:35 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-143,B,expert_1,,,Fri Dec 20 2024 03:07:16 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-143,A,expert_1,,,Sat Sep 21 2024 20:14:22 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-144,B,expert_49,,,Wed Jan 10 2024 11:41:11 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-144,B,expert_49,,,Thu Sep 19 2024 13:30:57 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-144,B,expert_57,,,Wed May 01 2024 10:41:16 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-144,B,expert_57,,,Wed Feb 07 2024 10:45:19 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-144,B,expert_20,,,Sat Aug 24 2024 21:13:21 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-144,A,expert_20,,,Sat Mar 23 2024 02:54:01 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-144,A,expert_9,,,Mon May 20 2024 15:10:38 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-144,A,expert_9,,,Mon Feb 19 2024 00:29:34 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-144,B,expert_5,,,Sun Aug 04 2024 06:53:49 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-144,B,expert_5,,,Wed Sep 18 2024 19:56:51 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-144,A,expert_8,,,Fri Nov 15 2024 04:28:32 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-144,Tie,expert_8,,,Tue Nov 12 2024 19:39:22 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-144,Tie,author_2,,,Wed Sep 11 2024 03:10:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-144,B,author_2,,,Sun Jan 14 2024 02:35:15 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-144,A,expert_24,,,Sat Jul 27 2024 19:17:46 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-144,B,expert_24,,,Wed Mar 27 2024 04:27:52 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-144,A,author_3,,,Tue Sep 17 2024 21:59:43 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-144,B,author_3,,,Thu Mar 28 2024 21:26:39 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-144,A,expert_26,,,Sat Nov 16 2024 14:59:09 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-144,A,expert_26,,,Sun Jun 23 2024 13:00:19 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-144,A,expert_13,,,Thu Apr 11 2024 15:04:25 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-144,A,expert_13,,,Thu Aug 01 2024 03:26:20 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-144,A,expert_57,,,Wed Sep 11 2024 06:30:24 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-144,A,expert_57,,,Tue Dec 24 2024 07:01:57 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-145,Tie,expert_48,,,Thu Jun 20 2024 04:07:39 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-145,Tie,expert_48,,,Mon Apr 08 2024 21:18:38 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-145,B,expert_24,,,Tue Aug 13 2024 10:30:19 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-145,B,expert_24,,,Tue Sep 10 2024 09:51:00 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-145,B,expert_37,,,Sat Oct 26 2024 04:23:47 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-145,B,expert_37,,,Sun Aug 18 2024 21:02:49 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-145,B,expert_41,,,Tue Sep 17 2024 19:30:39 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-145,B,expert_41,,,Sat Dec 14 2024 19:34:13 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-145,Tie,expert_24,,,Sun Sep 08 2024 03:43:41 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-145,A,expert_24,,,Wed Sep 11 2024 15:26:32 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-145,Tie,author_3,,,Tue Jan 02 2024 19:28:00 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-145,A,author_3,,,Wed Dec 25 2024 03:19:11 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-145,B,expert_27,,,Mon Nov 11 2024 06:23:06 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-145,B,expert_27,,,Fri Jun 28 2024 13:55:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-145,B,expert_3,,,Thu Sep 19 2024 18:03:24 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-145,A,expert_3,,,Fri Apr 19 2024 06:11:52 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-145,B,expert_5,,,Tue Oct 22 2024 15:16:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-145,B,expert_5,,,Mon Feb 26 2024 06:32:08 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-145,Tie,author_6,,,Wed Apr 10 2024 23:12:05 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-145,Tie,author_6,,,Fri Aug 16 2024 01:04:23 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-145,B,expert_22,,,Tue Feb 27 2024 09:43:09 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-145,B,expert_22,,,Mon Jun 17 2024 05:06:34 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-145,B,author_6,,,Sat Sep 14 2024 08:10:40 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-145,B,author_6,,,Fri Jul 26 2024 09:03:51 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-145,B,expert_29,,,Wed Jan 03 2024 14:10:16 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-145,B,expert_29,,,Sun Mar 10 2024 04:46:34 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-145,A,expert_29,,,Sat May 11 2024 19:11:32 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-145,B,expert_29,,,Tue Feb 20 2024 18:02:03 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-145,A,expert_16,,,Wed Aug 21 2024 03:49:31 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-145,A,expert_16,,,Sun Jun 02 2024 13:23:44 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-145,A,author_0,,,Fri Apr 19 2024 01:34:13 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-145,B,author_0,,,Thu Apr 04 2024 11:55:06 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-145,B,expert_1,,,Sun Jul 21 2024 05:52:30 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-145,B,expert_1,,,Sun Jan 21 2024 22:06:13 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-145,B,expert_1,,,Sat Feb 24 2024 00:02:00 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-145,B,expert_1,,,Sun Apr 28 2024 01:34:07 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-146,B,expert_14,,,Thu Sep 19 2024 23:20:56 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-146,A,expert_14,,,Sat Sep 21 2024 01:17:33 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-146,A,author_2,,,Tue Dec 24 2024 19:24:51 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-146,A,author_2,,,Sun Dec 08 2024 01:45:56 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-146,A,author_0,,,Fri Nov 08 2024 02:23:55 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-146,A,author_0,,,Thu Nov 14 2024 08:50:09 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-146,A,author_2,,,Sat Nov 23 2024 17:00:33 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-146,A,author_2,,,Fri Oct 04 2024 14:53:37 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-146,B,author_4,,,Mon Nov 04 2024 04:07:25 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-146,B,author_4,,,Tue Jun 11 2024 06:33:19 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-146,Tie,expert_37,,,Sat Sep 28 2024 06:20:44 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-146,A,expert_37,,,Thu Feb 15 2024 03:35:57 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-146,A,expert_22,,,Sat Jun 01 2024 19:34:43 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-146,A,expert_22,,,Fri May 03 2024 08:06:23 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-146,A,expert_20,,,Sat Oct 26 2024 14:31:00 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-146,A,expert_20,,,Tue Dec 10 2024 13:41:43 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-146,Tie,expert_25,,,Mon Aug 19 2024 21:05:50 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-146,B,expert_46,,,Fri Dec 06 2024 03:56:42 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-146,A,expert_46,,,Fri Oct 11 2024 16:30:22 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-146,A,expert_0,,,Sun Apr 21 2024 02:34:07 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-146,A,expert_0,,,Fri Apr 05 2024 21:58:03 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-146,A,expert_19,,,Fri Apr 19 2024 10:24:08 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-146,Tie,expert_19,,,Sun Jul 28 2024 09:19:02 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-146,B,expert_11,,,Thu Oct 10 2024 23:49:10 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-146,B,expert_11,,,Sun Mar 03 2024 07:20:50 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-146,B,expert_22,,,Mon Nov 11 2024 03:56:07 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-146,B,expert_22,,,Fri Sep 20 2024 16:47:46 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-146,B,expert_38,,,Mon Jun 10 2024 04:01:32 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-146,B,expert_38,,,Mon Feb 19 2024 11:46:11 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-146,B,expert_9,,,Fri Oct 18 2024 02:58:26 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-146,B,expert_9,,,Thu Mar 14 2024 11:30:06 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-146,B,expert_36,,,Thu Mar 21 2024 02:14:18 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-146,B,expert_36,,,Fri Jan 12 2024 08:25:11 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-146,B,author_2,,,Wed May 01 2024 03:30:45 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-146,B,author_2,,,Wed Mar 13 2024 12:36:00 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-146,B,expert_57,,,Wed Nov 20 2024 23:21:18 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-146,B,expert_57,,,Thu Oct 03 2024 08:48:34 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-146,B,expert_11,,,Fri Jan 19 2024 07:55:41 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-146,B,expert_11,,,Fri Sep 27 2024 15:43:16 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-146,B,expert_40,,,Mon Mar 18 2024 21:01:58 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-146,B,expert_40,,,Sat Aug 24 2024 09:27:23 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-146,A,expert_51,,,Sat Dec 07 2024 12:06:37 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-146,A,expert_51,,,Mon Sep 09 2024 19:41:22 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-146,B,expert_23,,,Fri Apr 05 2024 13:21:06 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-146,B,expert_23,,,Sat Feb 10 2024 23:03:43 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-146,B,expert_8,,,Sat Feb 10 2024 12:08:27 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-146,B,expert_8,,,Sat Jun 01 2024 08:39:43 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-146,A,expert_28,,,Tue Oct 15 2024 01:19:25 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-146,A,expert_28,,,Fri Jun 14 2024 00:02:58 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-147,B,expert_14,,,Mon Jan 01 2024 18:46:33 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-147,B,expert_14,,,Wed Jun 19 2024 15:06:31 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-147,B,expert_0,,,Sun Aug 04 2024 05:03:21 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-147,B,expert_0,,,Tue Jul 23 2024 05:24:15 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-147,B,expert_47,,,Wed Sep 25 2024 05:19:12 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-147,B,expert_47,,,Thu Apr 25 2024 11:00:59 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-147,Tie,expert_1,,,Sun Sep 08 2024 07:28:09 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-147,A,expert_1,,,Tue Mar 12 2024 17:41:42 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-147,B,expert_28,,,Thu Feb 15 2024 06:02:29 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-147,B,expert_28,,,Sat Apr 20 2024 02:50:05 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-147,A,expert_5,,,Sat Jan 06 2024 01:32:27 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-147,A,expert_5,,,Mon Jan 15 2024 03:31:42 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-147,A,expert_39,,,Sun Mar 17 2024 00:03:57 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-147,A,expert_39,,,Fri Jan 26 2024 09:45:27 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-147,B,author_3,,,Fri Sep 06 2024 02:11:32 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-147,B,author_3,,,Fri Jul 12 2024 18:55:15 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-147,B,expert_9,,,Sun Apr 14 2024 06:08:25 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-147,B,expert_9,,,Mon Apr 22 2024 19:03:31 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-147,A,expert_1,,,Tue Jan 09 2024 11:35:13 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-147,A,expert_1,,,Sun Jun 16 2024 17:54:04 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-147,A,expert_24,,,Tue Nov 05 2024 16:32:05 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-147,A,expert_24,,,Mon Jun 24 2024 14:23:10 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-147,A,expert_3,,,Fri Apr 26 2024 17:36:02 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-147,A,expert_3,,,Mon Feb 12 2024 16:51:15 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-147,Tie,expert_49,,,Thu Oct 03 2024 20:13:45 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-147,A,expert_49,,,Sun Jul 07 2024 19:09:34 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-147,A,expert_27,,,Thu Feb 22 2024 00:04:16 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-147,A,expert_27,,,Sat Dec 21 2024 02:46:02 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-147,B,expert_49,,,Thu Mar 21 2024 01:42:08 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-147,Tie,expert_49,,,Sat Apr 27 2024 18:08:15 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-147,A,expert_24,,,Mon May 06 2024 21:26:39 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-147,Tie,expert_24,,,Sat Sep 21 2024 17:24:15 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-147,B,expert_26,,,Wed Sep 25 2024 18:05:20 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-147,B,expert_26,,,Tue Sep 10 2024 20:20:08 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-147,Tie,expert_35,,,Wed Dec 25 2024 04:02:49 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-147,B,expert_35,,,Mon Sep 23 2024 17:53:16 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-147,Tie,author_3,,,Wed Mar 13 2024 16:35:52 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-147,B,author_3,,,Wed Jun 19 2024 05:30:33 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-147,B,expert_0,,,Sun Jan 14 2024 02:33:22 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-147,Tie,expert_0,,,Tue Feb 06 2024 08:30:25 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-148,B,expert_14,,,Wed Nov 06 2024 18:23:07 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-148,B,expert_14,,,Fri Mar 15 2024 13:41:13 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-148,B,expert_19,,,Tue Jun 18 2024 09:27:02 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-148,B,expert_19,,,Fri Jan 26 2024 03:51:10 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-148,A,author_6,,,Sun Jul 28 2024 14:36:58 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-148,A,author_6,,,Tue Oct 01 2024 16:43:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-148,Tie,expert_35,,,Sun Apr 07 2024 03:04:40 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-148,Tie,expert_35,,,Fri Feb 02 2024 05:53:45 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-148,A,author_1,,,Wed Feb 28 2024 12:12:31 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-148,B,author_1,,,Fri Feb 09 2024 23:59:54 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-148,A,expert_5,,,Tue Sep 17 2024 10:24:35 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-148,B,expert_5,,,Fri Apr 12 2024 23:30:25 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-148,B,expert_55,,,Tue Apr 16 2024 06:30:00 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-148,B,expert_55,,,Tue Nov 19 2024 15:22:31 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-148,B,expert_56,,,Mon Jul 22 2024 09:00:02 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-148,B,expert_56,,,Sat Dec 07 2024 13:17:07 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-148,A,author_4,,,Sun Sep 08 2024 06:25:15 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-148,A,author_4,,,Sat Jul 27 2024 20:13:52 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-148,A,expert_11,,,Thu Mar 21 2024 16:17:35 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-148,A,expert_11,,,Sat Nov 23 2024 02:42:02 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-148,B,expert_49,,,Sun Jan 21 2024 15:29:28 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-148,A,expert_49,,,Fri Mar 22 2024 19:41:32 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-148,B,expert_54,,,Sat Apr 27 2024 12:24:59 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-148,A,expert_54,,,Thu Jul 11 2024 11:49:29 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-148,A,author_3,,,Sun Sep 22 2024 04:44:54 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-148,A,author_3,,,Fri May 17 2024 10:05:43 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-148,Tie,expert_4,,,Wed Nov 27 2024 18:59:27 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-148,A,expert_4,,,Sun Aug 11 2024 00:39:53 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-148,B,expert_0,,,Wed Oct 02 2024 20:41:59 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-148,A,expert_0,,,Fri Aug 09 2024 14:34:48 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-148,A,expert_12,,,Sat Jun 08 2024 05:52:43 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-148,B,expert_12,,,Thu Oct 03 2024 19:56:20 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-148,A,expert_53,,,Wed Dec 18 2024 18:54:46 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-148,A,expert_53,,,Sun Jul 28 2024 17:53:31 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-148,A,expert_0,,,Sun Sep 22 2024 02:51:40 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-148,B,expert_0,,,Fri Dec 06 2024 18:44:50 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-148,B,author_3,,,Sun May 19 2024 06:30:48 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-148,B,author_3,,,Sun Mar 24 2024 13:46:55 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-148,B,expert_11,,,Tue Nov 12 2024 08:35:07 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-148,B,expert_11,,,Mon Sep 23 2024 17:37:50 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-148,B,expert_14,,,Sat Oct 19 2024 06:49:36 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-148,B,expert_14,,,Tue May 21 2024 14:43:11 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-148,Tie,expert_23,,,Wed Apr 03 2024 02:58:30 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-148,B,expert_23,,,Sun Mar 03 2024 16:49:49 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-148,B,expert_34,,,Thu Jul 25 2024 01:28:20 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-148,B,expert_34,,,Sun Jan 07 2024 07:00:52 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-148,B,expert_14,,,Sun Aug 25 2024 08:27:08 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-148,B,expert_14,,,Wed Sep 04 2024 05:03:22 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-148,A,expert_0,,,Tue Jan 09 2024 01:58:00 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-148,B,expert_0,,,Thu Oct 10 2024 09:57:18 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-148,B,expert_13,,,Wed Dec 18 2024 16:38:56 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-148,B,expert_13,,,Fri Oct 18 2024 06:50:09 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-148,A,expert_45,,,Sun Feb 04 2024 12:05:22 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-148,B,expert_45,,,Fri Apr 05 2024 23:19:05 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-148,Tie,author_0,,,Sun Oct 06 2024 03:44:50 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-148,A,author_0,,,Sun Mar 24 2024 21:14:04 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-149,B,expert_9,,,Sat Feb 03 2024 14:20:13 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-149,B,expert_9,,,Thu Dec 19 2024 06:57:23 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-149,B,author_0,,,Thu Aug 15 2024 03:41:59 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-149,B,author_0,,,Wed Jan 24 2024 06:13:10 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-149,B,expert_6,,,Sun Sep 15 2024 10:35:03 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-149,B,expert_6,,,Sat Aug 17 2024 09:12:08 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-149,B,expert_13,,,Wed Jan 10 2024 03:25:15 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-149,B,expert_13,,,Sat Jul 06 2024 09:39:58 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-149,A,author_3,,,Wed May 15 2024 07:52:22 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-149,A,author_3,,,Tue May 14 2024 12:25:16 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-149,Tie,expert_35,,,Thu Feb 15 2024 18:09:54 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-149,B,expert_35,,,Fri Jul 26 2024 04:22:10 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-149,Tie,expert_47,,,Sun Feb 18 2024 05:26:13 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-149,A,expert_47,,,Fri Nov 08 2024 17:07:38 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-149,A,expert_57,,,Sun May 26 2024 21:12:26 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-149,A,expert_57,,,Tue Feb 20 2024 07:59:56 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-149,A,expert_19,,,Tue Jun 04 2024 12:24:06 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-149,A,expert_19,,,Fri Jul 12 2024 17:25:23 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-149,A,expert_22,,,Sun Jul 28 2024 22:17:31 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-149,A,expert_22,,,Sat Apr 27 2024 00:56:20 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-149,A,expert_47,,,Wed Jun 12 2024 08:09:10 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-149,A,expert_47,,,Sun Mar 03 2024 21:30:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-149,B,expert_23,,,Wed Jan 17 2024 02:18:08 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-149,Tie,expert_23,,,Sun Jun 16 2024 03:17:18 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-149,A,expert_22,,,Mon Oct 21 2024 12:52:24 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-149,B,expert_22,,,Mon Nov 04 2024 01:32:06 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-149,A,expert_24,,,Fri Nov 08 2024 22:06:07 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-149,A,expert_24,,,Sun Dec 22 2024 07:00:07 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-149,A,expert_36,,,Mon Apr 01 2024 14:01:15 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-149,A,expert_36,,,Tue Nov 26 2024 09:55:12 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-149,B,expert_41,,,Wed Oct 09 2024 16:05:20 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-149,B,expert_41,,,Sat Jan 13 2024 03:06:55 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-149,B,author_0,,,Mon Jan 22 2024 08:26:03 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-149,B,author_0,,,Wed Jun 19 2024 01:21:18 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-149,B,author_4,,,Thu Aug 22 2024 14:22:34 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-149,B,author_4,,,Fri Nov 22 2024 20:58:09 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-149,B,expert_25,,,Tue Jul 09 2024 16:09:34 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-149,B,expert_25,,,Sun Aug 11 2024 20:42:02 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-149,B,author_3,,,Sun Jul 07 2024 11:20:41 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-149,Tie,author_3,,,Wed Mar 06 2024 06:20:39 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-149,A,expert_41,,,Wed Mar 06 2024 16:21:39 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-149,A,expert_41,,,Mon Sep 23 2024 05:49:43 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-149,Tie,author_1,,,Tue May 14 2024 20:39:08 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-149,B,author_1,,,Fri Jul 26 2024 07:45:30 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-149,B,expert_3,,,Wed Aug 07 2024 23:18:54 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-149,B,expert_3,,,Wed Jan 03 2024 02:57:47 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-149,A,author_2,,,Thu Sep 05 2024 08:53:47 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-149,A,author_2,,,Sun Nov 03 2024 03:22:20 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-149,A,author_6,,,Thu Sep 26 2024 18:51:08 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-149,A,author_6,,,Thu Jun 06 2024 18:45:14 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-150,B,expert_36,,,Tue Nov 05 2024 14:53:00 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-150,B,expert_36,,,Sat Jan 27 2024 16:17:43 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-150,A,expert_13,,,Thu Apr 18 2024 19:22:03 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-150,A,expert_13,,,Wed Sep 11 2024 15:26:27 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-150,Tie,expert_8,,,Tue Aug 27 2024 05:07:53 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-150,Tie,expert_8,,,Tue Jan 23 2024 15:27:22 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-150,A,expert_20,,,Mon Apr 08 2024 16:21:06 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-150,A,expert_20,,,Fri Jul 19 2024 11:49:34 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-150,A,expert_23,,,Thu Feb 22 2024 14:08:21 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-150,B,expert_23,,,Sat Aug 24 2024 09:52:53 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-150,A,expert_47,,,Sat Apr 13 2024 15:36:05 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-150,Tie,expert_47,,,Sun Mar 10 2024 01:27:15 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-150,A,expert_23,,,Mon Jul 01 2024 21:27:57 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-150,A,expert_23,,,Fri Aug 09 2024 14:11:05 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-150,A,author_0,,,Thu Apr 18 2024 05:15:24 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-150,A,author_0,,,Wed Feb 28 2024 23:09:54 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-150,A,expert_34,,,Sat Jul 20 2024 16:35:55 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-150,A,expert_34,,,Tue Jun 11 2024 02:40:49 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-150,A,expert_57,,,Mon Aug 26 2024 04:47:55 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-150,A,expert_57,,,Thu Jan 18 2024 11:56:27 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-150,A,expert_12,,,Wed Apr 17 2024 02:51:20 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-150,Tie,expert_12,,,Tue Oct 22 2024 22:52:01 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-150,A,author_2,,,Sat Jun 01 2024 02:22:02 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-150,A,author_2,,,Sun Feb 25 2024 10:08:05 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-150,B,expert_28,,,Sun Jul 28 2024 17:39:26 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-150,B,expert_28,,,Fri Oct 25 2024 03:14:15 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-150,B,expert_50,,,Tue Jan 16 2024 00:15:39 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-150,B,expert_50,,,Sun Mar 10 2024 21:39:17 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-150,A,expert_57,,,Sun Apr 07 2024 22:01:16 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-150,A,expert_57,,,Sun Oct 13 2024 19:13:55 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-150,A,author_0,,,Tue Jul 09 2024 22:46:11 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-150,A,author_0,,,Wed Aug 28 2024 16:27:26 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-150,A,author_4,,,Wed Feb 14 2024 20:10:08 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-150,B,author_4,,,Sun Jan 28 2024 01:50:59 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-150,B,expert_24,,,Sun Oct 06 2024 04:35:06 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-150,A,expert_24,,,Mon Oct 28 2024 07:30:13 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-150,B,expert_21,,,Mon Apr 01 2024 14:02:00 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-150,B,expert_21,,,Sun Jul 14 2024 23:01:58 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-150,B,expert_38,,,Tue Mar 19 2024 00:43:26 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-150,B,expert_38,,,Sat Jan 06 2024 06:16:37 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-151,B,expert_34,,,Tue Oct 15 2024 08:11:15 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-151,B,expert_34,,,Thu Jan 25 2024 01:04:56 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-151,B,author_0,,,Wed Aug 21 2024 16:56:30 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-151,B,author_0,,,Tue Mar 12 2024 14:41:54 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-151,Tie,author_0,,,Sun Oct 20 2024 17:37:38 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-151,B,author_0,,,Mon Oct 28 2024 03:43:35 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-151,B,expert_55,,,Sat Jul 27 2024 14:21:06 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-151,A,expert_55,,,Sat Dec 21 2024 16:47:27 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-151,B,expert_9,,,Sat Apr 27 2024 02:18:24 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-151,B,expert_9,,,Sun Feb 25 2024 00:37:15 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-151,A,author_5,,,Sat Jun 22 2024 10:06:16 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-151,A,author_5,,,Wed Dec 04 2024 20:51:58 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-151,A,expert_21,,,Sat Jun 15 2024 02:07:03 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-151,A,expert_21,,,Sun Mar 03 2024 07:14:03 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-151,A,expert_17,,,Sun Jan 14 2024 08:51:55 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-151,B,expert_17,,,Thu Dec 19 2024 12:11:53 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-151,B,expert_26,,,Thu Jan 18 2024 18:04:00 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-151,A,expert_26,,,Fri Oct 18 2024 23:37:32 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-151,A,author_6,,,Sun Feb 18 2024 11:13:50 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-151,A,author_6,,,Sun Apr 07 2024 14:05:41 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-151,A,author_2,,,Fri Dec 13 2024 22:14:29 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-151,B,author_2,,,Wed Jan 17 2024 08:23:21 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-151,B,author_2,,,Wed Jun 05 2024 07:21:19 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-151,B,author_2,,,Fri Sep 20 2024 08:12:40 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-151,B,expert_24,,,Wed Nov 27 2024 19:05:26 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-151,B,expert_24,,,Sun Aug 04 2024 12:01:09 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-151,B,expert_38,,,Thu Sep 26 2024 16:08:09 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-151,B,expert_38,,,Sat Mar 23 2024 07:58:35 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-151,B,expert_4,,,Wed Dec 11 2024 22:15:04 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-151,B,expert_4,,,Sat Nov 09 2024 06:17:53 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-151,B,expert_46,,,Thu Apr 11 2024 12:16:42 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-151,B,expert_46,,,Fri Dec 27 2024 11:16:40 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-151,B,author_2,,,Sun Aug 04 2024 15:44:26 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-151,B,author_2,,,Tue Aug 06 2024 01:48:13 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-151,A,author_2,,,Wed Jun 19 2024 23:48:44 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-151,B,author_2,,,Mon Jul 22 2024 20:21:41 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-151,A,expert_15,,,Wed Apr 10 2024 00:27:50 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-151,A,expert_15,,,Mon May 13 2024 10:06:24 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-151,A,expert_6,,,Sat May 18 2024 03:30:02 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-151,A,expert_6,,,Tue Sep 10 2024 18:59:53 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-152,B,expert_9,,,Tue Mar 26 2024 18:57:28 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-152,B,expert_9,,,Fri Jul 26 2024 10:03:34 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-152,Tie,author_6,,,Thu Apr 04 2024 15:41:28 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-152,Tie,author_6,,,Thu Mar 21 2024 06:23:30 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-152,A,expert_47,,,Sat Dec 07 2024 12:28:09 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-152,A,expert_47,,,Sun Feb 18 2024 13:16:30 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-152,A,expert_5,,,Mon Feb 12 2024 09:33:50 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-152,A,expert_5,,,Fri Nov 22 2024 21:20:02 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-152,A,author_3,,,Wed Jun 12 2024 15:15:54 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-152,A,author_3,,,Mon Jan 01 2024 07:50:21 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-152,A,expert_12,,,Sun Feb 04 2024 02:54:21 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-152,A,expert_12,,,Sat Nov 09 2024 08:41:28 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-152,A,expert_38,,,Sun Dec 15 2024 00:37:21 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-152,A,expert_38,,,Sat Nov 09 2024 11:21:48 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-152,A,expert_48,,,Sat Jan 27 2024 07:04:35 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-152,A,expert_48,,,Wed Mar 13 2024 20:40:09 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-152,Tie,author_6,,,Sun Feb 25 2024 17:56:35 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-152,Tie,author_6,,,Fri Dec 20 2024 16:54:04 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-152,B,author_4,,,Sat Aug 03 2024 07:32:45 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-152,Tie,author_4,,,Tue Feb 27 2024 09:53:06 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-152,B,expert_56,,,Wed Feb 28 2024 17:21:21 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-152,B,expert_56,,,Tue Jan 09 2024 09:37:34 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-152,A,expert_57,,,Tue Mar 12 2024 01:14:37 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-152,A,expert_57,,,Mon Jun 10 2024 17:20:52 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-152,A,expert_31,,,Tue Mar 19 2024 06:12:57 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-152,Tie,expert_31,,,Wed Feb 28 2024 18:32:59 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-152,Tie,author_3,,,Fri Nov 08 2024 06:39:32 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-152,B,author_3,,,Mon Feb 05 2024 05:59:34 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-152,A,expert_28,,,Wed Jul 24 2024 17:55:18 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-152,A,expert_28,,,Mon May 27 2024 06:10:20 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-152,A,expert_0,,,Fri Jul 12 2024 04:06:38 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-152,Tie,expert_0,,,Fri Mar 08 2024 19:52:22 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-152,B,expert_43,,,Sat Sep 28 2024 04:47:42 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-152,B,expert_43,,,Tue Oct 01 2024 13:05:35 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-152,B,expert_55,,,Sun Apr 07 2024 01:45:42 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-152,B,expert_55,,,Tue Mar 19 2024 02:04:01 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-152,B,author_0,,,Wed Aug 14 2024 16:35:42 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-152,B,author_0,,,Sun Dec 08 2024 01:09:12 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-152,B,author_6,,,Mon Jan 08 2024 11:03:07 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-152,B,author_6,,,Wed May 22 2024 13:10:09 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-152,B,expert_39,,,Wed Dec 04 2024 23:43:42 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-152,B,expert_39,,,Sat Jan 13 2024 08:42:00 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-152,B,expert_34,,,Fri Jun 07 2024 11:28:23 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-152,B,expert_34,,,Thu Aug 08 2024 02:00:08 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-152,A,expert_44,,,Thu Apr 11 2024 18:49:57 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-152,B,expert_44,,,Wed Jan 17 2024 20:22:39 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-152,A,expert_56,,,Fri May 03 2024 13:55:43 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-152,A,expert_56,,,Thu Oct 03 2024 02:33:42 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-152,A,expert_7,,,Mon Oct 14 2024 02:45:27 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-152,A,expert_7,,,Tue Jun 04 2024 01:41:07 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-152,B,author_4,,,Fri Dec 27 2024 08:15:13 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-152,Tie,author_4,,,Fri Dec 13 2024 01:56:00 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-152,A,expert_34,,,Fri Nov 15 2024 17:02:10 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-152,B,expert_34,,,Sun Oct 27 2024 05:19:02 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-153,B,expert_47,,,Tue Jul 09 2024 04:30:11 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-153,B,expert_47,,,Thu Feb 01 2024 19:05:32 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-153,Tie,expert_2,,,Sat Jan 13 2024 12:12:05 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-153,B,expert_2,,,Tue Mar 19 2024 10:46:08 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-153,B,expert_27,,,Thu May 23 2024 02:45:26 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-153,B,expert_27,,,Sun Mar 10 2024 02:32:28 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-153,B,expert_32,,,Wed Oct 16 2024 22:49:56 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-153,B,expert_32,,,Sun Feb 11 2024 07:43:03 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-153,B,author_4,,,Wed Aug 14 2024 05:16:34 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-153,Tie,author_4,,,Wed Nov 13 2024 20:22:54 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-153,B,expert_16,,,Thu Jun 20 2024 11:59:46 GMT-0400 (Eastern Daylight Time)
claude-v1,vicuna-13b-v1.2,false,mtbench-153,B,expert_16,,,Thu Apr 25 2024 13:47:06 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-153,A,author_0,,,Sat Feb 10 2024 20:43:35 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-153,A,author_0,,,Sat Sep 07 2024 00:31:03 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-153,A,expert_30,,,Sun Jun 23 2024 19:26:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-153,A,expert_30,,,Fri Sep 20 2024 23:33:36 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-153,B,expert_32,,,Sun Oct 13 2024 03:55:55 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-153,B,expert_32,,,Tue Apr 16 2024 13:17:33 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-153,Tie,author_0,,,Sun Apr 14 2024 13:44:06 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-153,A,author_0,,,Fri May 03 2024 05:13:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-153,A,expert_43,,,Thu Jun 20 2024 22:31:09 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-153,A,expert_43,,,Mon Jan 15 2024 07:33:28 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-153,A,expert_46,,,Wed Oct 23 2024 06:51:02 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-153,A,expert_46,,,Sat Feb 17 2024 02:05:20 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-153,A,expert_34,,,Tue Oct 01 2024 08:22:35 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-153,A,expert_34,,,Fri Dec 27 2024 13:33:53 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-153,A,expert_10,,,Fri Apr 19 2024 11:41:30 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-153,A,expert_10,,,Sun Feb 18 2024 08:37:23 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-153,B,author_3,,,Thu Oct 24 2024 12:22:19 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-153,B,author_3,,,Wed Oct 02 2024 01:43:29 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-153,A,expert_46,,,Wed Mar 06 2024 22:05:28 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-153,A,expert_46,,,Sat Oct 26 2024 21:52:19 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-153,A,expert_1,,,Fri Mar 01 2024 06:03:52 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-153,Tie,expert_1,,,Wed Dec 18 2024 08:04:42 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-153,A,expert_9,,,Thu Oct 24 2024 03:42:36 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-153,A,expert_9,,,Thu Nov 28 2024 17:56:23 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-153,Tie,author_4,,,Thu Nov 28 2024 05:08:25 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-153,Tie,author_4,,,Sun Dec 08 2024 00:52:26 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-153,Tie,expert_25,,,Fri Feb 02 2024 08:32:11 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-153,Tie,expert_25,,,Wed May 22 2024 10:04:39 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-153,B,expert_19,,,Sat Apr 06 2024 06:06:38 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-153,B,expert_19,,,Wed Apr 17 2024 00:24:07 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-154,B,expert_26,,,Sat May 25 2024 10:38:03 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-154,B,expert_26,,,Wed Apr 24 2024 17:40:21 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-154,B,expert_51,,,Sat Jul 13 2024 14:06:24 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-154,B,expert_51,,,Sun May 12 2024 04:02:51 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-154,B,expert_33,,,Sun May 05 2024 01:52:32 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-154,Tie,expert_33,,,Fri Sep 27 2024 12:58:42 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-154,A,expert_27,,,Wed Apr 17 2024 03:13:56 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-154,A,expert_27,,,Thu Jul 11 2024 02:33:22 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-154,Tie,author_5,,,Fri Mar 01 2024 00:21:37 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-154,Tie,author_5,,,Mon Sep 02 2024 17:04:05 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-154,A,expert_53,,,Sat Aug 10 2024 06:54:37 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-154,A,expert_53,,,Tue Jun 11 2024 04:06:32 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-154,A,expert_24,,,Mon Jul 08 2024 19:40:29 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-154,A,expert_24,,,Tue Nov 26 2024 03:43:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-154,A,author_4,,,Thu Apr 11 2024 12:00:31 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-154,Tie,author_4,,,Tue Jan 16 2024 21:31:30 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-154,A,expert_17,,,Sun Jun 02 2024 18:13:54 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-154,B,expert_17,,,Wed May 08 2024 03:58:52 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-154,A,expert_46,,,Sun Oct 06 2024 21:21:24 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-154,A,expert_46,,,Sat Jun 01 2024 18:45:04 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-154,A,expert_7,,,Fri May 17 2024 08:55:22 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-154,A,expert_7,,,Fri Jul 12 2024 00:53:47 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-154,B,expert_16,,,Wed Aug 14 2024 13:05:46 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-154,B,expert_16,,,Fri Oct 18 2024 23:52:27 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-154,Tie,author_4,,,Sun Feb 11 2024 14:20:48 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-154,B,author_4,,,Sat Aug 17 2024 20:24:45 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-154,A,expert_18,,,Sun Feb 25 2024 22:17:09 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-154,A,expert_18,,,Mon Jun 24 2024 22:13:28 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-154,A,expert_52,,,Sat Apr 27 2024 00:24:10 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-154,A,expert_52,,,Mon Apr 01 2024 19:02:40 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-154,A,expert_9,,,Wed Apr 10 2024 08:22:01 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-154,A,expert_9,,,Wed Jul 03 2024 12:05:39 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-155,Tie,author_0,,,Fri Jan 12 2024 02:17:06 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-155,Tie,author_0,,,Thu Apr 04 2024 03:45:46 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-155,B,expert_17,,,Tue Mar 19 2024 00:30:46 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-155,B,expert_17,,,Fri May 03 2024 02:50:50 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-155,Tie,expert_27,,,Sat Aug 03 2024 06:06:13 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-155,B,expert_27,,,Mon May 27 2024 17:41:42 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-155,Tie,expert_24,,,Wed Jul 24 2024 04:55:04 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-155,Tie,expert_24,,,Tue Mar 19 2024 04:42:42 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-155,A,expert_15,,,Fri Sep 13 2024 13:37:59 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-4,false,mtbench-155,A,expert_15,,,Fri Dec 06 2024 06:13:29 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-155,A,expert_45,,,Sat Oct 05 2024 23:04:30 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-155,A,expert_45,,,Tue Feb 27 2024 16:06:20 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-155,A,expert_0,,,Wed Oct 09 2024 13:19:03 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-155,A,expert_0,,,Thu Aug 22 2024 06:33:11 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-155,A,expert_45,,,Sat Jan 20 2024 20:32:51 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-155,A,expert_45,,,Thu Oct 17 2024 03:02:52 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-155,Tie,author_5,,,Sat Feb 10 2024 02:48:08 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-155,B,author_5,,,Mon Sep 23 2024 10:21:16 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-155,A,expert_40,,,Sun Dec 01 2024 09:43:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-155,B,expert_40,,,Fri Feb 09 2024 12:22:12 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-155,B,author_4,,,Mon Jan 15 2024 17:54:23 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-155,A,author_4,,,Tue Mar 05 2024 21:07:43 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-155,A,expert_43,,,Sat Aug 24 2024 23:51:16 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-155,A,expert_43,,,Sat Jun 22 2024 03:58:55 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-155,A,expert_48,,,Sun Dec 22 2024 06:36:10 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-155,A,expert_48,,,Wed Oct 09 2024 08:04:18 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-155,B,expert_23,,,Fri Apr 12 2024 07:07:13 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-155,B,expert_23,,,Wed May 15 2024 10:26:27 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-155,B,expert_31,,,Sun Sep 15 2024 16:47:23 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-155,B,expert_31,,,Tue Dec 24 2024 17:34:28 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-155,B,author_0,,,Wed Sep 04 2024 08:32:03 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-155,Tie,author_0,,,Mon Dec 16 2024 21:01:37 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-155,B,expert_20,,,Sun Feb 11 2024 10:40:50 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-155,B,expert_20,,,Mon Oct 21 2024 21:57:46 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-155,B,expert_0,,,Fri Jun 07 2024 02:11:05 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-155,B,expert_0,,,Sun Jun 09 2024 07:41:35 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-155,B,expert_37,,,Wed Jan 03 2024 09:26:00 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-155,B,expert_37,,,Mon Jan 01 2024 20:45:24 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-155,A,expert_27,,,Fri Dec 13 2024 20:58:12 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-155,B,expert_27,,,Sat Jul 06 2024 02:08:39 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-155,A,expert_40,,,Sat Apr 20 2024 14:17:06 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-155,B,expert_40,,,Sun Oct 13 2024 06:22:40 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-155,B,expert_43,,,Mon Jan 08 2024 08:23:06 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-155,B,expert_43,,,Sat Jun 08 2024 08:10:42 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-155,A,expert_21,,,Thu Mar 21 2024 08:00:59 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-155,B,expert_21,,,Sat Jan 06 2024 05:00:03 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-155,Tie,expert_24,,,Mon Oct 07 2024 00:05:25 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-155,B,expert_24,,,Mon Jan 15 2024 19:21:27 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-155,B,expert_6,,,Mon May 27 2024 03:28:03 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-155,A,expert_6,,,Wed Jun 19 2024 09:02:52 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-155,Tie,expert_7,,,Mon Oct 21 2024 03:45:17 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-155,B,expert_7,,,Sun Feb 18 2024 01:14:58 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-155,B,expert_47,,,Fri Mar 15 2024 00:33:19 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-155,B,expert_47,,,Tue Dec 17 2024 07:36:05 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-156,Tie,author_4,,,Fri Aug 23 2024 22:05:48 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-156,Tie,author_4,,,Sat Sep 14 2024 07:30:49 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-156,B,expert_46,,,Sat Jul 06 2024 17:05:13 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-156,B,expert_46,,,Tue Feb 13 2024 19:54:59 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-156,Tie,author_3,,,Sun Nov 10 2024 11:26:06 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-156,B,author_3,,,Mon May 06 2024 16:18:14 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-156,A,author_5,,,Sat Sep 07 2024 16:11:51 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-156,A,expert_37,,,Thu Aug 22 2024 16:49:22 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-156,A,expert_37,,,Sun Apr 14 2024 08:00:02 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-156,Tie,expert_47,,,Fri Aug 23 2024 17:19:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-156,A,expert_47,,,Sat Aug 24 2024 11:04:48 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-156,B,expert_19,,,Sun May 26 2024 17:32:36 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-156,B,expert_19,,,Mon Jul 22 2024 13:04:30 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-156,Tie,expert_24,,,Sat Aug 10 2024 15:18:05 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-156,B,expert_24,,,Sat Feb 03 2024 00:33:02 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-156,A,expert_53,,,Tue Sep 10 2024 20:18:52 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-156,B,expert_53,,,Sat May 04 2024 08:36:43 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-156,A,expert_20,,,Mon Feb 19 2024 06:22:52 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-156,A,expert_20,,,Thu Sep 26 2024 18:44:39 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-156,B,expert_16,,,Tue Aug 20 2024 21:54:16 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-156,B,expert_16,,,Fri Mar 15 2024 08:31:53 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-156,A,expert_53,,,Mon Feb 19 2024 12:15:21 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-156,B,expert_53,,,Tue Nov 05 2024 20:37:41 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-156,B,expert_19,,,Wed Sep 11 2024 10:37:58 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-156,B,expert_19,,,Mon Feb 05 2024 07:16:05 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-156,B,expert_44,,,Fri Jan 05 2024 04:11:45 GMT-0400 (Eastern Daylight Time)
llama-13b,claude-v1,false,mtbench-156,B,expert_44,,,Tue Sep 03 2024 14:03:37 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-156,B,expert_7,,,Wed Jan 24 2024 05:52:58 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-156,B,expert_7,,,Sat May 25 2024 02:35:25 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-156,A,expert_0,,,Wed Nov 06 2024 10:36:33 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-156,A,expert_0,,,Tue Jun 25 2024 14:19:27 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-156,Tie,expert_13,,,Sat Feb 03 2024 15:34:33 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,alpaca-13b,false,mtbench-156,A,expert_13,,,Tue Jan 23 2024 09:41:04 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-156,B,expert_13,,,Sat Nov 02 2024 18:34:27 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-156,B,expert_13,,,Fri May 10 2024 18:34:28 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-156,A,author_0,,,Thu Mar 07 2024 15:35:41 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-156,A,author_0,,,Wed Jan 24 2024 22:51:03 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-156,B,expert_13,,,Sat Oct 19 2024 03:06:57 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-156,Tie,expert_5,,,Sun Aug 25 2024 19:25:50 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-156,B,expert_5,,,Thu Jan 04 2024 08:22:00 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-157,B,expert_21,,,Sun Aug 25 2024 07:24:08 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-157,B,expert_21,,,Tue Apr 09 2024 07:32:04 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-157,B,author_4,,,Thu Feb 08 2024 15:42:46 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-157,B,author_4,,,Mon Dec 02 2024 21:58:31 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-157,B,expert_25,,,Sat Mar 09 2024 12:14:11 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-157,B,expert_25,,,Thu Nov 21 2024 22:26:03 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-157,Tie,author_2,,,Sun Aug 25 2024 17:15:42 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-157,A,author_2,,,Thu Apr 25 2024 23:40:13 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-157,Tie,expert_35,,,Mon Dec 02 2024 23:08:15 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-157,Tie,expert_35,,,Thu Sep 12 2024 11:03:22 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-157,Tie,author_2,,,Tue Dec 17 2024 03:31:08 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-157,Tie,author_2,,,Sat Apr 13 2024 10:04:03 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-157,A,author_4,,,Tue Aug 06 2024 14:35:40 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-157,A,author_4,,,Sat Jul 13 2024 05:25:35 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-157,A,expert_36,,,Sat Jul 13 2024 15:47:48 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-157,A,expert_36,,,Sun Mar 10 2024 01:30:19 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-157,B,expert_43,,,Fri Oct 04 2024 17:30:24 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-157,A,expert_43,,,Thu Jun 13 2024 19:06:32 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-157,Tie,expert_9,,,Wed Dec 04 2024 09:58:09 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-157,A,expert_9,,,Sat Mar 02 2024 09:04:47 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-157,A,expert_17,,,Sat Aug 17 2024 20:09:02 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-157,A,expert_17,,,Tue Aug 13 2024 17:06:50 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-157,A,expert_7,,,Thu Nov 14 2024 05:22:00 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-157,B,expert_7,,,Sun Jul 07 2024 10:12:08 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-157,Tie,author_4,,,Sun Jan 07 2024 20:04:53 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-157,A,author_4,,,Wed Jun 05 2024 10:35:00 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-157,A,expert_39,,,Sat Dec 14 2024 13:41:34 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-157,B,expert_39,,,Tue Mar 05 2024 06:13:11 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-157,Tie,expert_35,,,Thu Mar 07 2024 03:44:06 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-157,Tie,expert_35,,,Sun Mar 24 2024 11:18:06 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-157,B,expert_5,,,Mon Nov 25 2024 01:23:38 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-157,A,expert_5,,,Wed Feb 07 2024 17:59:02 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-157,A,expert_56,,,Sat Feb 03 2024 12:15:27 GMT-0400 (Eastern Daylight Time)
gpt-4,alpaca-13b,false,mtbench-157,A,expert_56,,,Fri Feb 23 2024 11:21:10 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-157,Tie,expert_9,,,Mon Mar 25 2024 10:46:24 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-157,A,expert_9,,,Tue Aug 06 2024 06:22:31 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-157,Tie,expert_45,,,Tue Jun 04 2024 02:35:09 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-157,A,expert_45,,,Sat Nov 02 2024 12:53:07 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-157,A,expert_34,,,Wed Jul 03 2024 09:55:35 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-157,B,expert_34,,,Sat Mar 16 2024 10:58:12 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-157,A,expert_46,,,Sat Nov 09 2024 20:47:54 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-157,B,expert_46,,,Thu May 16 2024 09:11:06 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-158,B,author_3,,,Sat Apr 13 2024 06:58:13 GMT-0400 (Eastern Daylight Time)
alpaca-13b,claude-v1,false,mtbench-158,B,author_3,,,Sat May 11 2024 13:31:25 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-158,Tie,author_0,,,Tue Feb 13 2024 20:53:21 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-158,B,author_0,,,Mon Jan 01 2024 00:52:53 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-158,B,expert_15,,,Sun Dec 22 2024 20:42:08 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-158,B,expert_15,,,Wed Dec 11 2024 15:18:24 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-158,A,expert_37,,,Sun May 12 2024 16:32:05 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-158,A,expert_37,,,Fri Dec 27 2024 23:03:03 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-158,B,expert_48,,,Wed Aug 28 2024 22:31:50 GMT-0400 (Eastern Daylight Time)
alpaca-13b,llama-13b,false,mtbench-158,A,expert_48,,,Wed Jun 12 2024 04:27:14 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-158,A,expert_40,,,Tue May 07 2024 20:54:03 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-158,B,expert_40,,,Mon Aug 12 2024 14:29:28 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-158,A,expert_56,,,Wed Aug 07 2024 06:40:06 GMT-0400 (Eastern Daylight Time)
claude-v1,gpt-3.5-turbo,false,mtbench-158,B,expert_56,,,Sun May 05 2024 18:45:00 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-158,A,author_4,,,Mon Mar 04 2024 16:41:14 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-158,A,author_4,,,Sat Apr 06 2024 12:54:05 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-158,B,author_4,,,Sat Dec 21 2024 17:03:07 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-158,B,author_4,,,Sun May 12 2024 04:41:34 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-158,A,expert_8,,,Fri Sep 13 2024 12:21:46 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-158,A,expert_8,,,Wed Feb 28 2024 14:40:19 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-158,A,author_0,,,Sun Mar 17 2024 15:58:33 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-158,Tie,author_0,,,Sat May 18 2024 03:46:10 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-158,A,expert_36,,,Mon Aug 12 2024 10:58:54 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-158,A,expert_36,,,Thu Dec 05 2024 12:30:54 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-158,A,expert_54,,,Fri Feb 16 2024 07:22:34 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-158,A,expert_54,,,Wed Jul 24 2024 17:15:03 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-158,B,expert_0,,,Mon Dec 02 2024 04:53:08 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-158,B,expert_0,,,Mon Feb 05 2024 11:28:45 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-158,B,expert_14,,,Tue Aug 27 2024 08:00:27 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-158,B,expert_14,,,Fri Jan 19 2024 12:14:59 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-158,B,expert_27,,,Mon Nov 25 2024 14:38:09 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-158,B,expert_27,,,Fri Aug 16 2024 10:40:45 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-158,Tie,author_5,,,Fri Oct 18 2024 00:51:26 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-158,A,author_5,,,Wed Jan 17 2024 22:55:28 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-158,A,expert_37,,,Sun Dec 22 2024 07:56:52 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-158,A,expert_37,,,Mon Jun 17 2024 13:40:52 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-159,B,expert_24,,,Sat Jan 06 2024 15:17:08 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-159,B,expert_24,,,Sun Feb 18 2024 17:18:36 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-159,B,expert_25,,,Fri Oct 18 2024 06:35:30 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-159,B,expert_25,,,Sun Aug 18 2024 08:09:46 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-159,B,expert_40,,,Thu Feb 15 2024 21:46:58 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-4,false,mtbench-159,B,expert_40,,,Fri Apr 12 2024 16:55:46 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-159,B,expert_2,,,Wed Sep 04 2024 01:46:30 GMT-0400 (Eastern Daylight Time)
alpaca-13b,vicuna-13b-v1.2,false,mtbench-159,B,expert_2,,,Tue May 14 2024 21:19:48 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-159,A,expert_8,,,Mon Dec 02 2024 02:39:53 GMT-0400 (Eastern Daylight Time)
claude-v1,alpaca-13b,false,mtbench-159,A,expert_8,,,Sun Nov 03 2024 23:14:03 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-159,A,author_0,,,Sat Jan 27 2024 03:34:00 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-159,Tie,author_0,,,Wed Aug 21 2024 13:02:47 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-159,A,expert_15,,,Sun Oct 20 2024 09:23:48 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-159,A,expert_15,,,Thu Jul 04 2024 03:56:57 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-159,B,author_0,,,Tue Jan 09 2024 22:45:28 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-159,Tie,author_0,,,Mon Sep 16 2024 22:24:16 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-159,B,expert_43,,,Mon Dec 02 2024 15:31:18 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-159,A,expert_43,,,Fri Jul 19 2024 22:00:43 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-159,B,expert_20,,,Thu Jan 25 2024 05:53:19 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-159,A,expert_20,,,Wed Nov 13 2024 23:36:04 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-159,A,author_0,,,Tue Jun 25 2024 18:41:41 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-159,A,author_0,,,Mon Aug 26 2024 22:33:53 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-159,A,expert_5,,,Fri Oct 04 2024 03:27:50 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-159,A,expert_5,,,Wed Jul 24 2024 13:26:33 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-159,A,expert_55,,,Mon Jul 22 2024 17:58:04 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-159,A,expert_55,,,Thu Mar 28 2024 20:54:25 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-159,Tie,expert_9,,,Tue Aug 20 2024 03:33:21 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,llama-13b,false,mtbench-159,A,expert_9,,,Wed Feb 14 2024 13:44:48 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-159,Tie,author_0,,,Wed Jun 26 2024 07:04:07 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-159,B,author_0,,,Mon Jun 17 2024 18:33:42 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-159,Tie,expert_28,,,Tue Mar 05 2024 02:48:34 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-159,A,expert_28,,,Wed Nov 20 2024 13:36:42 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-159,A,expert_40,,,Sat May 04 2024 06:16:14 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-159,A,expert_40,,,Sun Jan 28 2024 20:18:39 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-159,Tie,expert_49,,,Fri Aug 16 2024 22:06:44 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-159,A,expert_49,,,Wed Jan 17 2024 15:03:18 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-159,Tie,expert_25,,,Thu Feb 08 2024 03:27:38 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-159,A,expert_25,,,Sat Jun 01 2024 17:59:01 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-159,A,expert_40,,,Sat Apr 20 2024 23:45:14 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-159,B,expert_40,,,Wed Jan 03 2024 04:47:31 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-159,A,expert_15,,,Tue Sep 24 2024 06:27:32 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-159,A,expert_15,,,Tue Dec 24 2024 10:13:13 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-159,A,expert_53,,,Thu Jan 11 2024 15:16:12 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-159,A,expert_53,,,Tue Oct 15 2024 00:51:59 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-159,B,expert_44,,,Sat Sep 21 2024 02:56:04 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-159,B,expert_44,,,Wed Oct 16 2024 13:42:14 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-159,B,expert_14,,,Tue Sep 17 2024 23:33:47 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-159,B,expert_14,,,Thu May 16 2024 10:00:50 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-159,B,expert_16,,,Wed May 22 2024 07:02:19 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-4,false,mtbench-159,B,expert_16,,,Thu Jun 13 2024 06:36:50 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-159,B,expert_4,,,Tue Aug 06 2024 05:01:57 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-159,B,expert_4,,,Sun Apr 07 2024 18:46:14 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-159,Tie,expert_19,,,Thu Jun 13 2024 06:42:43 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-159,A,expert_19,,,Fri Dec 27 2024 03:39:15 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-159,B,expert_21,,,Fri Nov 15 2024 10:34:46 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-159,A,expert_21,,,Mon Nov 25 2024 22:54:18 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-159,B,expert_4,,,Wed Aug 21 2024 07:51:46 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-159,A,expert_4,,,Mon Jun 03 2024 16:22:21 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-159,Tie,expert_24,,,Mon Sep 09 2024 06:27:56 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-159,Tie,expert_24,,,Thu Feb 22 2024 02:56:08 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-159,A,expert_47,,,Sun Feb 11 2024 03:47:51 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-4,false,mtbench-159,B,expert_47,,,Mon Mar 11 2024 03:02:00 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-160,Tie,expert_17,,,Sat Sep 28 2024 07:17:35 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-160,B,expert_17,,,Thu Jun 27 2024 11:31:58 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-160,Tie,expert_24,,,Sat May 25 2024 18:21:26 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-160,Tie,expert_24,,,Wed Dec 18 2024 00:00:27 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-160,B,expert_32,,,Sat Apr 20 2024 02:00:26 GMT-0400 (Eastern Daylight Time)
alpaca-13b,gpt-3.5-turbo,false,mtbench-160,B,expert_32,,,Wed Jun 05 2024 09:12:00 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-160,Tie,expert_47,,,Tue Jan 09 2024 22:56:44 GMT-0400 (Eastern Daylight Time)
claude-v1,llama-13b,false,mtbench-160,A,expert_47,,,Mon Jan 01 2024 18:32:26 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-160,A,expert_0,,,Mon Dec 02 2024 19:45:07 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-160,A,expert_0,,,Mon Aug 12 2024 11:00:14 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-160,A,expert_37,,,Sat Sep 14 2024 00:13:49 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-160,A,expert_37,,,Sat May 25 2024 06:48:07 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-160,A,expert_49,,,Fri Oct 04 2024 18:28:52 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,alpaca-13b,false,mtbench-160,A,expert_49,,,Tue Nov 19 2024 19:41:12 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-160,Tie,expert_24,,,Tue May 21 2024 02:33:47 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,claude-v1,false,mtbench-160,B,expert_24,,,Tue Jun 11 2024 11:54:08 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-160,B,expert_34,,,Tue Sep 17 2024 12:31:29 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,gpt-4,false,mtbench-160,B,expert_34,,,Wed Feb 28 2024 15:45:28 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-160,Tie,author_0,,,Fri Sep 27 2024 00:40:38 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-160,A,author_0,,,Fri Nov 08 2024 08:19:57 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-160,B,expert_19,,,Tue Jul 09 2024 17:39:57 GMT-0400 (Eastern Daylight Time)
gpt-3.5-turbo,vicuna-13b-v1.2,false,mtbench-160,Tie,expert_19,,,Tue Apr 16 2024 18:34:41 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-160,Tie,expert_9,,,Tue Apr 23 2024 09:31:10 GMT-0400 (Eastern Daylight Time)
gpt-4,claude-v1,false,mtbench-160,Tie,expert_9,,,Thu Jan 11 2024 19:36:09 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-160,Tie,expert_47,,,Wed Dec 25 2024 14:53:23 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-160,Tie,expert_47,,,Sun Aug 18 2024 05:49:45 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-160,A,expert_7,,,Mon Apr 01 2024 14:19:40 GMT-0400 (Eastern Daylight Time)
gpt-4,gpt-3.5-turbo,false,mtbench-160,A,expert_7,,,Sat Oct 26 2024 19:25:40 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-160,A,expert_3,,,Mon Mar 25 2024 22:21:56 GMT-0400 (Eastern Daylight Time)
gpt-4,llama-13b,false,mtbench-160,A,expert_3,,,Thu Apr 18 2024 13:25:37 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-160,Tie,expert_9,,,Mon Apr 01 2024 12:48:52 GMT-0400 (Eastern Daylight Time)
gpt-4,vicuna-13b-v1.2,false,mtbench-160,Tie,expert_9,,,Thu May 23 2024 23:30:44 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-160,A,expert_0,,,Thu Jul 04 2024 00:34:02 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-160,B,expert_0,,,Sun May 12 2024 16:27:25 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-160,A,expert_22,,,Fri Mar 01 2024 21:34:59 GMT-0400 (Eastern Daylight Time)
llama-13b,alpaca-13b,false,mtbench-160,A,expert_22,,,Tue Jan 23 2024 20:44:58 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-160,A,expert_55,,,Mon Mar 18 2024 08:31:09 GMT-0400 (Eastern Daylight Time)
llama-13b,gpt-3.5-turbo,false,mtbench-160,B,expert_55,,,Sat Jun 22 2024 16:08:29 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-160,B,expert_34,,,Thu Dec 26 2024 21:19:18 GMT-0400 (Eastern Daylight Time)
llama-13b,vicuna-13b-v1.2,false,mtbench-160,B,expert_34,,,Sun Aug 11 2024 19:24:08 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-160,Tie,expert_0,,,Sun Jun 16 2024 23:55:24 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-160,B,expert_0,,,Thu Sep 26 2024 20:06:22 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-160,B,expert_36,,,Mon Jan 22 2024 04:49:57 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,claude-v1,false,mtbench-160,A,expert_36,,,Fri Jan 19 2024 21:41:51 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-160,Tie,author_4,,,Thu Dec 19 2024 13:11:33 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-160,Tie,author_4,,,Sat Jun 08 2024 16:05:37 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-160,B,expert_43,,,Fri Jun 21 2024 14:18:39 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,gpt-3.5-turbo,false,mtbench-160,B,expert_43,,,Tue Mar 19 2024 04:47:14 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-160,A,expert_0,,,Thu May 02 2024 09:20:59 GMT-0400 (Eastern Daylight Time)
vicuna-13b-v1.2,llama-13b,false,mtbench-160,A,expert_0,,,Sat Dec 07 2024 05:05:59 GMT-0400 (Eastern Daylight Time)
