Spaces:
Running
Running
update claude 4.5 flores results
Browse files
data/community_results/New Results - June2025.csv
CHANGED
|
@@ -1,72 +1,73 @@
|
|
| 1 |
-
model,task,prompt,eng,amh,hau,ibo,kin,lin,lug,orm,sna,sot,swa,xho,yor,zul,avg
|
| 2 |
-
Gemma 3 27b,injongointent,4.0,79.58,71.56,69.53,56.56,53.44,38.12,37.97,31.25,56.88,47.66,81.09,63.59,49.53,60.78,55.2
|
| 3 |
-
Gemma 3 27b,afrixnli,2.0,65.5,59.5,55.5,53.83,46.67,35.17,48.17,50.17,52.67,51.83,55.67,53.83,48.17,54.83,51.2
|
| 4 |
-
Gemma 3 27b,afrimmlu,1.0,74.2,52.6,45.2,47.0,44.6,36.8,34.0,34.2,45.2,44.8,60.2,44.8,40.2,47.0,44.4
|
| 5 |
-
Gemma 3 27b,afrimgsm,2.0,87.6,61.2,61.2,36.8,54.0,18.4,36.4,32.0,52.0,51.6,78.0,48.8,36.8,50.8,47.5
|
| 6 |
-
Gemma 3 27b,belebele,5.0,93.44,76.44,71.44,59.22,69.0,38.44,44.67,52.11,68.78,62.0,84.7,67.33,49.56,67.0,62.4
|
| 7 |
-
Gemma 3 27b,sib,3.0,87.25,83.33,80.4,81.86,82.84,59.8,67.16,58.33,76.47,72.55,72.06,77.45,71.08,80.88,74.2
|
| 8 |
-
Gemma 3 27b,flores - en_xx,,68.9,23.8,43.9,35.2,35.6,24.8,21.6,17.5,35.1,38.1,57.0,35.8,21.0,40.8,33.1
|
| 9 |
-
Gemini-2.0 Flash,injongointent,4.0,88.9,84.8,80.5,78.8,63.8,65.3,63.0,62.3,77.0,59.4,91.4,84.2,75.3,74.5,73.9
|
| 10 |
-
Gemini-2.0 Flash,sib,3.0,86.8,87.3,85.3,82.8,87.3,84.8,81.9,80.4,85.8,82.8,87.8,86.3,84.3,87.3,84.9
|
| 11 |
-
Gemini-2.0 Flash,afrixnli,3.0,87.0,74.2,72.0,68.7,62.5,32.2,67.5,70.0,71.5,68.7,74.0,71.8,63.2,68.3,66.5
|
| 12 |
-
Gemini-2.0 Flash,belebele,4.0,63.0,66.0,49.2,48.7,59.3,51.9,54.3,52.0,63.4,50.8,69.8,61.8,49.9,61.3,56.8
|
| 13 |
-
Gemini-2.0 Flash,afrimmlu,5.0,80.8,65.0,61.2,57.4,54.4,52.8,49.4,51.8,57.0,55.8,71.4,60.6,57.4,56.8,57.8
|
| 14 |
-
Gemini-2.0 Flash,afrimgsm,2.0,92.8,76.0,70.4,61.2,64.4,63.6,59.2,73.6,63.6,65.2,84.0,60.8,70.8,65.2,67.5
|
| 15 |
-
Gemini-2.0 Flash,flores - en_xx,2.0,71.5,66.0,60.9,57.8,59.2,51.7,52.2,54.7,54.8,63.6,70.3,62.4,50.5,64.2,59.1
|
| 16 |
-
Gemini-2.0 Flash,flores - xx_en,2.0,73.1,40.9,54.3,45.2,53.0,51.5,44.0,44.2,50.2,52.0,65.2,54.3,31.6,58.4,49.6
|
| 17 |
-
GPT-4.1 (April),injongointent,1.0,87.8,86.6,93.3,86.6,77.2,82.8,81.3,73.8,90.2,75.0,93.9,89.5,85.6,81.9,84.4
|
| 18 |
-
GPT-4.1 (April),sib,1.0,89.7,85.8,84.8,85.8,87.3,84.3,82.4,84.3,86.3,86.3,81.4,87.7,80.4,85.8,84.8
|
| 19 |
-
GPT-4.1 (April),afrixnli,1.0,88.5,70.8,72.7,69.0,69.3,32.0,67.0,68.0,73.7,71.5,72.8,74.0,67.2,69.8,67.5
|
| 20 |
-
GPT-4.1 (April),belebele,1.0,73.9,72.0,48.0,37.7,76.4,61.7,54.0,58.3,77.6,60.8,90.0,78.0,52.2,76.1,64.8
|
| 21 |
-
GPT-4.1 (April),afrimmlu,1.0,71.4,55.2,55.4,56.2,63.8,60.2,50.2,53.0,65.2,57.0,76.8,66.6,53.6,69.8,60.2
|
| 22 |
-
GPT-4.1 (April),afrimgsm,1.0,82.4,57.2,57.2,54.0,60.4,49.6,54.4,64.4,60.0,64.4,77.2,51.2,65.2,58.0,59.5
|
| 23 |
-
GPT-4.1 (April),flores - en_xx,1.0,73.1,32.5,53.1,42.0,53.2,48.7,41.3,41.6,49.6,50.6,65.5,53.6,27.5,55.7,47.3
|
| 24 |
-
LLaMa 4 405B,injongointent,4.0,88.9,84.8,80.5,78.8,63.8,65.3,63.0,62.3,77.0,59.4,91.4,84.2,75.3,74.5,73.9
|
| 25 |
-
LLaMa 4 405B,sib,3.0,84.8,86.8,80.9,82.4,74.5,84.3,79.4,71.6,77.5,77.9,86.8,84.8,78.9,81.9,80.6
|
| 26 |
-
LLaMa 4 405B,afrixnli,2.0,49.2,56.8,44.8,53.3,43.0,35.3,42.5,45.0,46.5,43.7,48.5,47.0,41.8,43.0,45.5
|
| 27 |
-
LLaMa 4 405B,belebele,5.0,25.0,24.78,24.11,24.44,24.67,25.22,24.78,24.22,24.67,25.22,24.56,24.78,23.89,24.33,24.6
|
| 28 |
-
LLaMa 4 405B,afrimmlu,1.0,11.2,18.4,16.2,18.0,14.2,10.8,14.8,16.0,15.2,16.0,15.6,16.4,16.8,17.0,15.8
|
| 29 |
-
LLaMa 4 405B,afrimgsm,4.0,97.6,83.2,68.8,64.4,60.0,52.0,46.8,58.8,67.2,65.2,89.2,61.2,64.8,64.0,65.0
|
| 30 |
-
LLaMa 4 405B,flores - en_xx,3.0,73.0,37.64,50.34,43.73,39.05,41.76,34.11,36.48,40.53,40.07,61.96,50.25,28.0,53.07,42.8
|
| 31 |
-
LLaMa 4 405B,flores - xx_en,3.0,71.55,62.57,56.47,53.5,54.28,43.12,44.89,46.96,50.36,56.32,67.83,58.03,44.82,60.64,53.8
|
| 32 |
-
Lugha-Llama 8B,injongointent,1.0,16.7,3.1,5.8,4.2,3.0,8.0,2.3,2.5,2.5,5.0,5.6,2.7,5.8,2.5,4.1
|
| 33 |
-
Lugha-Llama 8B,sib,1.0,43.6,43.6,32.4,30.9,41.7,24.5,34.8,42.2,29.4,30.4,42.6,27.0,43.1,21.1,34.1
|
| 34 |
-
Lugha-Llama 8B,afrixnli,1.0,46.8,37.0,37.3,37.2,35.5,33.3,34.2,36.2,35.8,35.8,39.7,37.2,38.7,38.7,36.7
|
| 35 |
-
Lugha-Llama 8B,belebele,1.0,22.4,23.1,22.9,22.9,23.2,22.9,23.7,22.1,23.2,22.7,23.4,22.8,22.9,23.1,23.0
|
| 36 |
-
Lugha-Llama 8B,afrimmlu,1.0,31.8,24.6,24.8,23.8,24.8,26.4,24.6,23.2,26.2,25.4,27.8,26.6,23.6,25.6,25.2
|
| 37 |
-
Lugha-Llama 8B,afrimgsm,1.0,6.4,2.4,0.8,2.0,1.2,0.8,2.4,1.6,0.8,2.0,2.0,2.0,2.4,3.6,1.8
|
| 38 |
-
Lugha-Llama 8B,flores - en_xx,1.0,51.3,7.9,19.3,25.5,29.2,9.6,15.3,5.7,30.3,25.9,40.9,31.3,16.9,29.4,22.1
|
| 39 |
-
Gemini-2.5
|
| 40 |
-
Gemini-2.5
|
| 41 |
-
Gemini-2.5
|
| 42 |
-
Gemini-2.5
|
| 43 |
-
Gemini-2.5
|
| 44 |
-
Gemini-2.5
|
| 45 |
-
Gemini-2.5
|
| 46 |
-
|
| 47 |
-
|
| 48 |
-
|
| 49 |
-
|
| 50 |
-
|
| 51 |
-
|
| 52 |
-
|
| 53 |
-
Claude
|
| 54 |
-
Claude
|
| 55 |
-
Claude
|
| 56 |
-
Claude
|
| 57 |
-
Claude
|
| 58 |
-
Claude
|
| 59 |
-
Claude
|
| 60 |
-
Claude 4
|
| 61 |
-
Claude 4
|
| 62 |
-
Claude 4
|
| 63 |
-
Claude 4
|
| 64 |
-
Claude 4
|
| 65 |
-
Claude 4
|
| 66 |
-
|
| 67 |
-
|
| 68 |
-
|
| 69 |
-
|
| 70 |
-
|
| 71 |
-
|
| 72 |
-
|
|
|
|
|
|
| 1 |
+
model,task,prompt,eng,amh,hau,ibo,kin,lin,lug,orm,sna,sot,swa,xho,yor,zul,avg
|
| 2 |
+
Gemma 3 27b,injongointent,4.0,79.58,71.56,69.53,56.56,53.44,38.12,37.97,31.25,56.88,47.66,81.09,63.59,49.53,60.78,55.2
|
| 3 |
+
Gemma 3 27b,afrixnli,2.0,65.5,59.5,55.5,53.83,46.67,35.17,48.17,50.17,52.67,51.83,55.67,53.83,48.17,54.83,51.2
|
| 4 |
+
Gemma 3 27b,afrimmlu,1.0,74.2,52.6,45.2,47.0,44.6,36.8,34.0,34.2,45.2,44.8,60.2,44.8,40.2,47.0,44.4
|
| 5 |
+
Gemma 3 27b,afrimgsm,2.0,87.6,61.2,61.2,36.8,54.0,18.4,36.4,32.0,52.0,51.6,78.0,48.8,36.8,50.8,47.5
|
| 6 |
+
Gemma 3 27b,belebele,5.0,93.44,76.44,71.44,59.22,69.0,38.44,44.67,52.11,68.78,62.0,84.7,67.33,49.56,67.0,62.4
|
| 7 |
+
Gemma 3 27b,sib,3.0,87.25,83.33,80.4,81.86,82.84,59.8,67.16,58.33,76.47,72.55,72.06,77.45,71.08,80.88,74.2
|
| 8 |
+
Gemma 3 27b,flores - en_xx,,68.9,23.8,43.9,35.2,35.6,24.8,21.6,17.5,35.1,38.1,57.0,35.8,21.0,40.8,33.1
|
| 9 |
+
Gemini-2.0 Flash,injongointent,4.0,88.9,84.8,80.5,78.8,63.8,65.3,63.0,62.3,77.0,59.4,91.4,84.2,75.3,74.5,73.9
|
| 10 |
+
Gemini-2.0 Flash,sib,3.0,86.8,87.3,85.3,82.8,87.3,84.8,81.9,80.4,85.8,82.8,87.8,86.3,84.3,87.3,84.9
|
| 11 |
+
Gemini-2.0 Flash,afrixnli,3.0,87.0,74.2,72.0,68.7,62.5,32.2,67.5,70.0,71.5,68.7,74.0,71.8,63.2,68.3,66.5
|
| 12 |
+
Gemini-2.0 Flash,belebele,4.0,63.0,66.0,49.2,48.7,59.3,51.9,54.3,52.0,63.4,50.8,69.8,61.8,49.9,61.3,56.8
|
| 13 |
+
Gemini-2.0 Flash,afrimmlu,5.0,80.8,65.0,61.2,57.4,54.4,52.8,49.4,51.8,57.0,55.8,71.4,60.6,57.4,56.8,57.8
|
| 14 |
+
Gemini-2.0 Flash,afrimgsm,2.0,92.8,76.0,70.4,61.2,64.4,63.6,59.2,73.6,63.6,65.2,84.0,60.8,70.8,65.2,67.5
|
| 15 |
+
Gemini-2.0 Flash,flores - en_xx,2.0,71.5,66.0,60.9,57.8,59.2,51.7,52.2,54.7,54.8,63.6,70.3,62.4,50.5,64.2,59.1
|
| 16 |
+
Gemini-2.0 Flash,flores - xx_en,2.0,73.1,40.9,54.3,45.2,53.0,51.5,44.0,44.2,50.2,52.0,65.2,54.3,31.6,58.4,49.6
|
| 17 |
+
GPT-4.1 (April),injongointent,1.0,87.8,86.6,93.3,86.6,77.2,82.8,81.3,73.8,90.2,75.0,93.9,89.5,85.6,81.9,84.4
|
| 18 |
+
GPT-4.1 (April),sib,1.0,89.7,85.8,84.8,85.8,87.3,84.3,82.4,84.3,86.3,86.3,81.4,87.7,80.4,85.8,84.8
|
| 19 |
+
GPT-4.1 (April),afrixnli,1.0,88.5,70.8,72.7,69.0,69.3,32.0,67.0,68.0,73.7,71.5,72.8,74.0,67.2,69.8,67.5
|
| 20 |
+
GPT-4.1 (April),belebele,1.0,73.9,72.0,48.0,37.7,76.4,61.7,54.0,58.3,77.6,60.8,90.0,78.0,52.2,76.1,64.8
|
| 21 |
+
GPT-4.1 (April),afrimmlu,1.0,71.4,55.2,55.4,56.2,63.8,60.2,50.2,53.0,65.2,57.0,76.8,66.6,53.6,69.8,60.2
|
| 22 |
+
GPT-4.1 (April),afrimgsm,1.0,82.4,57.2,57.2,54.0,60.4,49.6,54.4,64.4,60.0,64.4,77.2,51.2,65.2,58.0,59.5
|
| 23 |
+
GPT-4.1 (April),flores - en_xx,1.0,73.1,32.5,53.1,42.0,53.2,48.7,41.3,41.6,49.6,50.6,65.5,53.6,27.5,55.7,47.3
|
| 24 |
+
LLaMa 4 405B,injongointent,4.0,88.9,84.8,80.5,78.8,63.8,65.3,63.0,62.3,77.0,59.4,91.4,84.2,75.3,74.5,73.9
|
| 25 |
+
LLaMa 4 405B,sib,3.0,84.8,86.8,80.9,82.4,74.5,84.3,79.4,71.6,77.5,77.9,86.8,84.8,78.9,81.9,80.6
|
| 26 |
+
LLaMa 4 405B,afrixnli,2.0,49.2,56.8,44.8,53.3,43.0,35.3,42.5,45.0,46.5,43.7,48.5,47.0,41.8,43.0,45.5
|
| 27 |
+
LLaMa 4 405B,belebele,5.0,25.0,24.78,24.11,24.44,24.67,25.22,24.78,24.22,24.67,25.22,24.56,24.78,23.89,24.33,24.6
|
| 28 |
+
LLaMa 4 405B,afrimmlu,1.0,11.2,18.4,16.2,18.0,14.2,10.8,14.8,16.0,15.2,16.0,15.6,16.4,16.8,17.0,15.8
|
| 29 |
+
LLaMa 4 405B,afrimgsm,4.0,97.6,83.2,68.8,64.4,60.0,52.0,46.8,58.8,67.2,65.2,89.2,61.2,64.8,64.0,65.0
|
| 30 |
+
LLaMa 4 405B,flores - en_xx,3.0,73.0,37.64,50.34,43.73,39.05,41.76,34.11,36.48,40.53,40.07,61.96,50.25,28.0,53.07,42.8
|
| 31 |
+
LLaMa 4 405B,flores - xx_en,3.0,71.55,62.57,56.47,53.5,54.28,43.12,44.89,46.96,50.36,56.32,67.83,58.03,44.82,60.64,53.8
|
| 32 |
+
Lugha-Llama 8B,injongointent,1.0,16.7,3.1,5.8,4.2,3.0,8.0,2.3,2.5,2.5,5.0,5.6,2.7,5.8,2.5,4.1
|
| 33 |
+
Lugha-Llama 8B,sib,1.0,43.6,43.6,32.4,30.9,41.7,24.5,34.8,42.2,29.4,30.4,42.6,27.0,43.1,21.1,34.1
|
| 34 |
+
Lugha-Llama 8B,afrixnli,1.0,46.8,37.0,37.3,37.2,35.5,33.3,34.2,36.2,35.8,35.8,39.7,37.2,38.7,38.7,36.7
|
| 35 |
+
Lugha-Llama 8B,belebele,1.0,22.4,23.1,22.9,22.9,23.2,22.9,23.7,22.1,23.2,22.7,23.4,22.8,22.9,23.1,23.0
|
| 36 |
+
Lugha-Llama 8B,afrimmlu,1.0,31.8,24.6,24.8,23.8,24.8,26.4,24.6,23.2,26.2,25.4,27.8,26.6,23.6,25.6,25.2
|
| 37 |
+
Lugha-Llama 8B,afrimgsm,1.0,6.4,2.4,0.8,2.0,1.2,0.8,2.4,1.6,0.8,2.0,2.0,2.0,2.4,3.6,1.8
|
| 38 |
+
Lugha-Llama 8B,flores - en_xx,1.0,51.3,7.9,19.3,25.5,29.2,9.6,15.3,5.7,30.3,25.9,40.9,31.3,16.9,29.4,22.1
|
| 39 |
+
Gemini-2.5 Pro,afrixnli,3.0,90.0,79.8,76.3,79.2,72.3,32.2,73.2,78.2,78.2,74.0,76.5,78.5,72.0,75.3,72.7
|
| 40 |
+
Gemini-2.5 Pro,afrimgsm,2.0,89.2,80.8,74.8,75.2,74.4,62.8,63.2,82.8,77.6,72.8,88.4,66.8,77.6,69.6,74.4
|
| 41 |
+
Gemini-2.5 Pro,flores - en_xx,3.0,68.2,41.2,49.4,42.9,51.0,47.8,42.8,44.8,47.4,50.3,60.7,51.7,30.5,55.4,47.4
|
| 42 |
+
Gemini-2.5 Pro,afrimmlu,1.0,72.2,82.2,68.4,76.4,75.8,79.2,79.8,75.0,81.2,75.2,80.4,85.0,76.0,82.2,78.2
|
| 43 |
+
Gemini-2.5 Pro,injongointent,4.0,87.9,91.7,94.1,92.0,80.9,90.5,85.5,85.3,93.8,76.6,93.8,90.5,89.2,83.8,88.3
|
| 44 |
+
Gemini-2.5 Pro,sib,3.0,88.7,88.7,89.2,89.7,87.3,87.3,85.3,86.8,87.7,87.7,90.2,89.2,88.2,87.7,88.1
|
| 45 |
+
Gemini-2.5 Pro,belebele,5.0,78.1,85.6,56.1,62.2,80.9,78.9,75.4,74.1,84.4,73.7,87.8,86.3,68.8,83.0,76.7
|
| 46 |
+
Gemini-2.5 Flash,afrixnli,3.0,86.2,76.3,71.8,76.2,68.8,32.8,69.2,74.2,76.2,71.3,74.0,76.8,67.7,73.2,69.9
|
| 47 |
+
Gemini-2.5 Flash,afrimgsm,2.0,86.8,78.0,72.0,71.6,69.2,58.8,60.8,74.0,72.4,68.0,87.2,62.0,77.6,66.4,70.6
|
| 48 |
+
Gemini-2.5 Flash,flores - en_xx,3.0,67.8,41.5,50.1,42.8,50.4,46.4,41.0,43.0,46.7,48.4,60.6,50.9,28.2,54.4,46.5
|
| 49 |
+
Gemini-2.5 Flash,afrimmlu,1.0,83.6,74.4,60.6,62.4,62.2,70.0,71.2,72.6,69.4,61.4,56.6,73.8,72.0,73.8,67.7
|
| 50 |
+
Gemini-2.5 Flash,injongointent,4.0,89.1,92.8,95.0,91.4,80.5,86.7,85.5,82.8,92.3,76.9,95.0,89.8,89.8,83.8,87.9
|
| 51 |
+
Gemini-2.5 Flash,sib,3.0,90.2,87.7,86.8,85.3,85.8,90.2,85.8,87.3,85.3,87.3,89.2,88.7,86.8,87.7,87.2
|
| 52 |
+
Gemini-2.5 Flash,belebele,5.0,74.1,47.9,33.7,28.3,44.1,41.7,37.4,38.1,49.2,42.6,53.6,48.6,36.3,46.6,42.2
|
| 53 |
+
Claude 4.5 Sonnet,afrixnli,1.0,90.8,83.2,75.2,76.8,70.5,32.5,70.8,74.3,78.2,72.8,76.7,78.3,70.0,72.5,71.7
|
| 54 |
+
Claude 4.5 Sonnet,afrimgsm,4.0,96.4,80.8,73.2,72.8,71.2,65.2,63.6,74.8,68.4,73.6,91.6,68.4,77.6,69.6,73.1
|
| 55 |
+
Claude 4.5 Sonnet,flores - en_xx,3.0,69.7,41.8,51.1,44.0,49.0,47.7,41.2,41.7,45.8,49.8,60.4,51.3,29.8,52.8,46.6
|
| 56 |
+
Claude 4.5 Sonnet,afrimmlu,1.0,89.6,65.0,56.0,57.2,53.4,51.8,57.8,58.0,62.4,59.4,58.8,60.6,64.0,57.4,58.6
|
| 57 |
+
Claude 4.5 Sonnet,injongointent,4.0,88.3,90.6,89.2,83.8,70.8,78.6,75.9,71.9,86.1,70.3,93.6,87.3,83.4,79.8,81.6
|
| 58 |
+
Claude 4.5 Sonnet,sib,5.0,87.7,89.7,86.8,85.3,87.3,79.4,76.5,83.3,80.4,84.8,88.7,85.8,82.8,84.3,84.2
|
| 59 |
+
Claude 4.5 Sonnet,belebele,5.0,83.9,81.8,73.4,68.7,73.2,70.1,66.3,71.6,75.2,75.3,87.7,79.4,72.2,77.0,74.8
|
| 60 |
+
Claude 4 Sonnet,afrixnli,1.0,90.2,80.3,72.3,74.0,66.3,32.0,62.7,68.3,70.8,71.2,73.5,74.8,67.2,71.3,68.1
|
| 61 |
+
Claude 4 Sonnet,afrimgsm,4.0,94.0,76.4,68.8,63.6,63.2,58.8,55.6,64.8,68.0,66.8,86.0,59.6,71.2,67.2,66.9
|
| 62 |
+
Claude 4 Sonnet,flores - en_xx,3.0,69.8,41.1,51.1,43.5,47.8,47.6,41.0,41.2,44.9,48.8,60.0,51.6,27.6,52.4,46.0
|
| 63 |
+
Claude 4 Sonnet,afrimmlu,1.0,90.0,83.2,74.4,80.8,73.2,73.6,63.2,72.6,74.0,75.6,84.8,79.6,72.6,74.2,75.5
|
| 64 |
+
Claude 4 Sonnet,injongointent,4.0,89.7,90.6,88.3,84.7,69.1,77.0,74.5,67.8,84.8,68.0,92.5,87.0,81.6,78.8,80.4
|
| 65 |
+
Claude 4 Sonnet,sib,5.0,88.2,88.7,84.8,83.8,85.3,81.4,76.0,76.0,78.9,83.3,87.7,84.8,86.3,84.8,83.2
|
| 66 |
+
Claude 4 Sonnet,belebele,5.0,94.7,86.0,77.9,72.4,77.9,70.2,64.4,68.4,77.8,77.9,89.6,81.9,68.3,78.1,76.2
|
| 67 |
+
Claude 3.7 Sonnet,afrixnli,1.0,83.2,69.3,60.5,60.8,60.0,35.0,58.5,62.2,61.5,63.8,63.7,63.7,55.5,63.3,59.8
|
| 68 |
+
Claude 3.7 Sonnet,afrimgsm,4.0,60.4,46.0,30.4,30.4,37.2,26.8,30.8,32.8,30.8,36.0,53.2,32.0,38.4,33.2,35.2
|
| 69 |
+
Claude 3.7 Sonnet,flores - en_xx,3.0,69.9,37.6,45.6,39.1,46.8,45.4,40.4,38.9,40.9,50.9,60.5,47.9,27.7,50.3,44.0
|
| 70 |
+
Claude 3.7 Sonnet,afrimmlu,1.0,77.8,71.0,64.2,67.8,64.0,62.0,62.8,65.6,63.6,67.6,76.4,68.6,66.4,67.6,66.7
|
| 71 |
+
Claude 3.7 Sonnet,injongointent,4.0,84.1,82.0,79.2,72.3,66.4,65.3,71.4,59.8,76.4,64.2,88.8,82.2,73.8,71.9,73.4
|
| 72 |
+
Claude 3.7 Sonnet,sib,5.0,86.8,86.8,86.3,83.8,86.3,85.8,81.4,82.4,83.8,83.8,85.8,87.7,85.8,83.8,84.9
|
| 73 |
+
Claude 3.7 Sonnet,belebele,5.0,74.0,69.4,60.1,59.0,68.7,64.7,62.6,62.2,70.4,65.0,74.8,66.8,57.6,65.2,65.1
|