iteration,model,temperature,ccei
1,random,0.0,0.30081300813008127
2,random,0.0,0.29500000000000004
3,random,0.0,0.24739884393063583
4,random,0.0,0.2987012987012987
5,random,0.0,0.3548387096774194
6,random,0.0,0.3986486486486487
7,random,0.0,0.2810650887573965
8,random,0.0,0.35494880546075086
9,random,0.0,0.272
10,random,0.0,0.22171945701357465
11,random,0.0,0.3150105708245243
12,random,0.0,0.25641025641025644
13,random,0.0,0.1569506726457399
14,random,0.0,0.247787610619469
15,random,0.0,0.5156950672645739
16,random,0.0,0.2645739910313901
17,random,0.0,0.40444444444444444
18,random,0.0,0.27455919395465994
19,random,0.0,0.20800000000000002
20,random,0.0,0.20930232558139536
21,random,0.0,0.3823529411764706
22,random,0.0,0.49244712990936557
23,random,0.0,0.2
24,random,0.0,0.46881287726358145
25,random,0.0,0.30916414904330314
26,random,0.0,0.21908602150537634
27,random,0.0,0.21929824561403508
28,random,0.0,0.23555555555555555
29,random,0.0,0.4501510574018127
30,random,0.0,0.2896174863387978
1,llama3,0.0,0.5533333333333333
2,llama3,0.0,0.23636363636363636
3,llama3,0.0,0.38461538461538464
4,llama3,0.0,0.391304347826087
5,llama3,0.0,0.379746835443038
6,llama3,0.0,0.4473684210526316
7,llama3,0.0,0.2
8,llama3,0.0,0.45454545454545453
9,llama3,0.0,0.6133333333333333
10,llama3,0.0,0.4314720812182741
11,llama3,0.0,0.665
12,llama3,0.0,0.43533930857874514
13,llama3,0.0,0.5
14,llama3,0.0,0.519277108433735
15,llama3,0.0,0.27586206896551724
16,llama3,0.0,0.5555555555555556
17,llama3,0.0,0.5
18,llama3,0.0,0.35714285714285715
19,llama3,0.0,0.4246575342465753
20,llama3,0.0,0.25
21,llama3,0.0,0.23809523809523808
22,llama3,0.0,0.3333333333333333
23,llama3,0.0,0.475
24,llama3,0.0,0.6666666666666666
25,llama3,0.0,0.3151079136690647
26,llama3,0.0,0.3368421052631579
27,llama3,0.0,0.742
28,llama3,0.0,0.5333333333333333
29,llama3,0.0,0.5172413793103449
30,llama3,0.0,0.5
1,mistral-small,0.0,1.0
2,mistral-small,0.0,0.6222222222222222
3,mistral-small,0.0,0.8866666666666667
4,mistral-small,0.0,0.90625
5,mistral-small,0.0,0.6785714285714286
6,mistral-small,0.0,0.90625
7,mistral-small,0.0,0.5555555555555556
8,mistral-small,0.0,0.8844444444444444
9,mistral-small,0.0,0.8266666666666667
10,mistral-small,0.0,0.3333333333333333
11,mistral-small,0.0,0.8333333333333334
12,mistral-small,0.0,0.8888888888888888
13,mistral-small,0.0,0.925
14,mistral-small,0.0,0.78
15,mistral-small,0.0,0.804
16,mistral-small,0.0,0.75
17,mistral-small,0.0,0.84
18,mistral-small,0.0,0.625
19,mistral-small,0.0,0.90625
20,mistral-small,0.0,0.8166666666666667
21,mistral-small,0.0,0.875
22,mistral-small,0.0,0.9866666666666667
23,mistral-small,0.0,0.7733333333333333
24,mistral-small,0.0,0.92
25,mistral-small,0.0,0.8571428571428571
26,mistral-small,0.0,0.9375
27,mistral-small,0.0,0.7150000000000001
28,mistral-small,0.0,0.9625
29,mistral-small,0.0,0.8928571428571429
30,mistral-small,0.0,0.802
1,deepseek-r1,0.0,0.25
2,deepseek-r1,0.0,0.5882352941176471
3,deepseek-r1,0.0,0.42207792207792205
4,deepseek-r1,0.0,0.335
5,deepseek-r1,0.0,0.22105263157894736
6,deepseek-r1,0.0,0.22999999999999998
7,deepseek-r1,0.0,0.3058510638297872
8,deepseek-r1,0.0,0.32142857142857145
9,deepseek-r1,0.0,0.6711409395973154
10,deepseek-r1,0.0,0.25
11,deepseek-r1,0.0,0.75
12,deepseek-r1,0.0,0.8315217391304347
13,deepseek-r1,0.0,0.4597701149425288
14,deepseek-r1,0.0,0.32142857142857145
15,deepseek-r1,0.0,0.16875
16,deepseek-r1,0.0,0.25157232704402516
17,deepseek-r1,0.0,0.574712643678161
18,deepseek-r1,0.0,0.28776978417266186
19,deepseek-r1,0.0,0.32142857142857145
20,deepseek-r1,0.0,0.7304347826086957
21,deepseek-r1,0.0,0.17329910141206675
22,deepseek-r1,0.0,0.175
23,deepseek-r1,0.0,0.45454545454545453
24,deepseek-r1,0.0,0.2992700729927008
25,deepseek-r1,0.0,0.34
26,deepseek-r1,0.0,0.2
27,deepseek-r1,0.0,0.3333333333333333
28,deepseek-r1,0.0,0.1870967741935484
29,deepseek-r1,0.0,0.2575
30,deepseek-r1,0.0,0.1514285714285714
1,mixtral:8x7b,0.0,0.8152173913043478
2,mixtral:8x7b,0.0,0.8418604651162791
3,mixtral:8x7b,0.0,0.8540540540540541
4,mixtral:8x7b,0.0,0.875
5,mixtral:8x7b,0.0,0.8085106382978723
6,mixtral:8x7b,0.0,0.8444444444444444
7,mixtral:8x7b,0.0,0.9032258064516129
8,mixtral:8x7b,0.0,0.8298319327731092
9,mixtral:8x7b,0.0,0.8333333333333334
10,mixtral:8x7b,0.0,0.875
11,mixtral:8x7b,0.0,0.8260869565217391
12,mixtral:8x7b,0.0,0.82
13,mixtral:8x7b,0.0,0.8636363636363636
14,mixtral:8x7b,0.0,0.8333333333333334
15,mixtral:8x7b,0.0,0.8444444444444444
16,mixtral:8x7b,0.0,0.8636363636363636
17,mixtral:8x7b,0.0,0.82
18,mixtral:8x7b,0.0,0.82
19,mixtral:8x7b,0.0,0.8787878787878788
20,mixtral:8x7b,0.0,0.8285714285714286
21,mixtral:8x7b,0.0,0.8085106382978723
22,mixtral:8x7b,0.0,0.8787878787878788
23,mixtral:8x7b,0.0,0.8785714285714286
24,mixtral:8x7b,0.0,0.7894736842105263
25,mixtral:8x7b,0.0,0.8421052631578947
1,llama3.3:latest,0.0,1.0
2,llama3.3:latest,0.0,1.0
3,llama3.3:latest,0.0,1.0
4,llama3.3:latest,0.0,1.0
5,llama3.3:latest,0.0,1.0
6,llama3.3:latest,0.0,1.0
7,llama3.3:latest,0.0,1.0
8,llama3.3:latest,0.0,1.0
9,llama3.3:latest,0.0,1.0
10,llama3.3:latest,0.0,1.0
11,llama3.3:latest,0.0,1.0
12,llama3.3:latest,0.0,1.0
13,llama3.3:latest,0.0,1.0
14,llama3.3:latest,0.0,1.0
15,llama3.3:latest,0.0,1.0
16,llama3.3:latest,0.0,1.0
17,llama3.3:latest,0.0,1.0
18,llama3.3:latest,0.0,1.0
19,llama3.3:latest,0.0,1.0
20,llama3.3:latest,0.0,1.0
21,llama3.3:latest,0.0,1.0
22,llama3.3:latest,0.0,1.0
23,llama3.3:latest,0.0,1.0
24,llama3.3:latest,0.0,1.0
25,llama3.3:latest,0.0,1.0
26,llama3.3:latest,0.0,1.0
27,llama3.3:latest,0.0,1.0
28,llama3.3:latest,0.0,1.0
29,llama3.3:latest,0.0,1.0
30,llama3.3:latest,0.0,1.0
1,deepseek-r1:7b,0.0,1.0
2,deepseek-r1:7b,0.0,1.0
3,deepseek-r1:7b,0.0,1.0
4,deepseek-r1:7b,0.0,1.0
5,deepseek-r1:7b,0.0,1.0
6,deepseek-r1:7b,0.0,1.0
7,deepseek-r1:7b,0.0,1.0
8,deepseek-r1:7b,0.0,1.0
9,deepseek-r1:7b,0.0,1.0
10,deepseek-r1:7b,0.0,1.0
11,deepseek-r1:7b,0.0,1.0
12,deepseek-r1:7b,0.0,1.0
13,deepseek-r1:7b,0.0,1.0
14,deepseek-r1:7b,0.0,1.0
15,deepseek-r1:7b,0.0,1.0
16,deepseek-r1:7b,0.0,1.0
17,deepseek-r1:7b,0.0,1.0
18,deepseek-r1:7b,0.0,1.0
19,deepseek-r1:7b,0.0,1.0
20,deepseek-r1:7b,0.0,1.0
21,deepseek-r1:7b,0.0,1.0
22,deepseek-r1:7b,0.0,1.0
23,deepseek-r1:7b,0.0,1.0
24,deepseek-r1:7b,0.0,1.0
25,deepseek-r1:7b,0.0,1.0
26,deepseek-r1:7b,0.0,1.0
27,deepseek-r1:7b,0.0,1.0
28,deepseek-r1:7b,0.0,1.0
29,deepseek-r1:7b,0.0,1.0
30,deepseek-r1:7b,0.0,1.0
1,gpt-4.5-preview-2025-02-27,0.0,1.0
2,gpt-4.5-preview-2025-02-27,0.0,1.0
3,gpt-4.5-preview-2025-02-27,0.0,1.0
4,gpt-4.5-preview-2025-02-27,0.0,1.0
5,gpt-4.5-preview-2025-02-27,0.0,1.0
6,gpt-4.5-preview-2025-02-27,0.0,1.0
7,gpt-4.5-preview-2025-02-27,0.0,1.0
8,gpt-4.5-preview-2025-02-27,0.0,1.0
9,gpt-4.5-preview-2025-02-27,0.0,1.0
10,gpt-4.5-preview-2025-02-27,0.0,1.0
11,gpt-4.5-preview-2025-02-27,0.0,1.0
12,gpt-4.5-preview-2025-02-27,0.0,1.0
13,gpt-4.5-preview-2025-02-27,0.0,1.0
14,gpt-4.5-preview-2025-02-27,0.0,1.0
15,gpt-4.5-preview-2025-02-27,0.0,1.0
16,gpt-4.5-preview-2025-02-27,0.0,1.0
17,gpt-4.5-preview-2025-02-27,0.0,1.0
18,gpt-4.5-preview-2025-02-27,0.0,1.0
19,gpt-4.5-preview-2025-02-27,0.0,1.0
20,gpt-4.5-preview-2025-02-27,0.0,1.0
21,gpt-4.5-preview-2025-02-27,0.0,1.0
22,gpt-4.5-preview-2025-02-27,0.0,1.0
23,gpt-4.5-preview-2025-02-27,0.0,1.0
24,gpt-4.5-preview-2025-02-27,0.0,1.0
25,gpt-4.5-preview-2025-02-27,0.0,1.0
26,gpt-4.5-preview-2025-02-27,0.0,1.0
27,gpt-4.5-preview-2025-02-27,0.0,1.0
28,gpt-4.5-preview-2025-02-27,0.0,1.0
29,gpt-4.5-preview-2025-02-27,0.0,1.0
30,gpt-4.5-preview-2025-02-27,0.0,1.0
1,qwen3,0.0,1.0
2,qwen3,0.0,1.0
3,qwen3,0.0,1.0
4,qwen3,0.0,1.0
5,qwen3,0.0,1.0
6,qwen3,0.0,0.85
7,qwen3,0.0,1.0
8,qwen3,0.0,1.0
9,qwen3,0.0,1.0
10,qwen3,0.0,1.0
11,qwen3,0.0,1.0
12,qwen3,0.0,1.0
13,qwen3,0.0,1.0
14,qwen3,0.0,1.0
15,qwen3,0.0,1.0
16,qwen3,0.0,1.0
17,qwen3,0.0,1.0
18,qwen3,0.0,1.0
19,qwen3,0.0,1.0
20,qwen3,0.0,1.0
21,qwen3,0.0,0.85
22,qwen3,0.0,1.0
23,qwen3,0.0,1.0
24,qwen3,0.0,1.0
25,qwen3,0.0,1.0
26,qwen3,0.0,1.0
27,qwen3,0.0,1.0
28,qwen3,0.0,0.85
29,qwen3,0.0,1.0
30,qwen3,0.0,1.0

