update claude 4.5 flores results

#11
data/community_results/New Results - June2025.csv CHANGED
@@ -1,72 +1,73 @@
1
- model,task,prompt,eng,amh,hau,ibo,kin,lin,lug,orm,sna,sot,swa,xho,yor,zul,avg,prompt_num
2
- Gemma 3 27b,injongointent,4.0,79.58,71.56,69.53,56.56,53.44,38.12,37.97,31.25,56.88,47.66,81.09,63.59,49.53,60.78,55.2,
3
- Gemma 3 27b,afrixnli,2.0,65.5,59.5,55.5,53.83,46.67,35.17,48.17,50.17,52.67,51.83,55.67,53.83,48.17,54.83,51.2,
4
- Gemma 3 27b,afrimmlu,1.0,74.2,52.6,45.2,47.0,44.6,36.8,34.0,34.2,45.2,44.8,60.2,44.8,40.2,47.0,44.4,
5
- Gemma 3 27b,afrimgsm,2.0,87.6,61.2,61.2,36.8,54.0,18.4,36.4,32.0,52.0,51.6,78.0,48.8,36.8,50.8,47.5,
6
- Gemma 3 27b,belebele,5.0,93.44,76.44,71.44,59.22,69.0,38.44,44.67,52.11,68.78,62.0,84.7,67.33,49.56,67.0,62.4,
7
- Gemma 3 27b,sib,3.0,87.25,83.33,80.4,81.86,82.84,59.8,67.16,58.33,76.47,72.55,72.06,77.45,71.08,80.88,74.2,
8
- Gemma 3 27b,flores - en_xx,,68.9,23.8,43.9,35.2,35.6,24.8,21.6,17.5,35.1,38.1,57.0,35.8,21.0,40.8,33.1,
9
- Gemini-2.0 Flash,injongointent,4.0,88.9,84.8,80.5,78.8,63.8,65.3,63.0,62.3,77.0,59.4,91.4,84.2,75.3,74.5,73.9,
10
- Gemini-2.0 Flash,sib,3.0,86.8,87.3,85.3,82.8,87.3,84.8,81.9,80.4,85.8,82.8,87.8,86.3,84.3,87.3,84.9,
11
- Gemini-2.0 Flash,afrixnli,3.0,87.0,74.2,72.0,68.7,62.5,32.2,67.5,70.0,71.5,68.7,74.0,71.8,63.2,68.3,66.5,
12
- Gemini-2.0 Flash,belebele,4.0,63.0,66.0,49.2,48.7,59.3,51.9,54.3,52.0,63.4,50.8,69.8,61.8,49.9,61.3,56.8,
13
- Gemini-2.0 Flash,afrimmlu,5.0,80.8,65.0,61.2,57.4,54.4,52.8,49.4,51.8,57.0,55.8,71.4,60.6,57.4,56.8,57.8,
14
- Gemini-2.0 Flash,afrimgsm,2.0,92.8,76.0,70.4,61.2,64.4,63.6,59.2,73.6,63.6,65.2,84.0,60.8,70.8,65.2,67.5,
15
- Gemini-2.0 Flash,flores - en_xx,2.0,71.5,66.0,60.9,57.8,59.2,51.7,52.2,54.7,54.8,63.6,70.3,62.4,50.5,64.2,59.1,
16
- Gemini-2.0 Flash,flores - xx_en,2.0,73.1,40.9,54.3,45.2,53.0,51.5,44.0,44.2,50.2,52.0,65.2,54.3,31.6,58.4,49.6,
17
- GPT-4.1 (April),injongointent,1.0,87.8,86.6,93.3,86.6,77.2,82.8,81.3,73.8,90.2,75.0,93.9,89.5,85.6,81.9,84.4,
18
- GPT-4.1 (April),sib,1.0,89.7,85.8,84.8,85.8,87.3,84.3,82.4,84.3,86.3,86.3,81.4,87.7,80.4,85.8,84.8,
19
- GPT-4.1 (April),afrixnli,1.0,88.5,70.8,72.7,69.0,69.3,32.0,67.0,68.0,73.7,71.5,72.8,74.0,67.2,69.8,67.5,
20
- GPT-4.1 (April),belebele,1.0,73.9,72.0,48.0,37.7,76.4,61.7,54.0,58.3,77.6,60.8,90.0,78.0,52.2,76.1,64.8,
21
- GPT-4.1 (April),afrimmlu,1.0,71.4,55.2,55.4,56.2,63.8,60.2,50.2,53.0,65.2,57.0,76.8,66.6,53.6,69.8,60.2,
22
- GPT-4.1 (April),afrimgsm,1.0,82.4,57.2,57.2,54.0,60.4,49.6,54.4,64.4,60.0,64.4,77.2,51.2,65.2,58.0,59.5,
23
- GPT-4.1 (April),flores - en_xx,1.0,73.1,32.5,53.1,42.0,53.2,48.7,41.3,41.6,49.6,50.6,65.5,53.6,27.5,55.7,47.3,
24
- LLaMa 4 405B,injongointent,4.0,88.9,84.8,80.5,78.8,63.8,65.3,63.0,62.3,77.0,59.4,91.4,84.2,75.3,74.5,73.9,
25
- LLaMa 4 405B,sib,3.0,84.8,86.8,80.9,82.4,74.5,84.3,79.4,71.6,77.5,77.9,86.8,84.8,78.9,81.9,80.6,
26
- LLaMa 4 405B,afrixnli,2.0,49.2,56.8,44.8,53.3,43.0,35.3,42.5,45.0,46.5,43.7,48.5,47.0,41.8,43.0,45.5,
27
- LLaMa 4 405B,belebele,5.0,25.0,24.78,24.11,24.44,24.67,25.22,24.78,24.22,24.67,25.22,24.56,24.78,23.89,24.33,24.6,
28
- LLaMa 4 405B,afrimmlu,1.0,11.2,18.4,16.2,18.0,14.2,10.8,14.8,16.0,15.2,16.0,15.6,16.4,16.8,17.0,15.8,
29
- LLaMa 4 405B,afrimgsm,4.0,97.6,83.2,68.8,64.4,60.0,52.0,46.8,58.8,67.2,65.2,89.2,61.2,64.8,64.0,65.0,
30
- LLaMa 4 405B,flores - en_xx,3.0,73.0,37.64,50.34,43.73,39.05,41.76,34.11,36.48,40.53,40.07,61.96,50.25,28.0,53.07,42.8,
31
- LLaMa 4 405B,flores - xx_en,3.0,71.55,62.57,56.47,53.5,54.28,43.12,44.89,46.96,50.36,56.32,67.83,58.03,44.82,60.64,53.8,
32
- Lugha-Llama 8B,injongointent,1.0,16.7,3.1,5.8,4.2,3.0,8.0,2.3,2.5,2.5,5.0,5.6,2.7,5.8,2.5,4.1,
33
- Lugha-Llama 8B,sib,1.0,43.6,43.6,32.4,30.9,41.7,24.5,34.8,42.2,29.4,30.4,42.6,27.0,43.1,21.1,34.1,
34
- Lugha-Llama 8B,afrixnli,1.0,46.8,37.0,37.3,37.2,35.5,33.3,34.2,36.2,35.8,35.8,39.7,37.2,38.7,38.7,36.7,
35
- Lugha-Llama 8B,belebele,1.0,22.4,23.1,22.9,22.9,23.2,22.9,23.7,22.1,23.2,22.7,23.4,22.8,22.9,23.1,23.0,
36
- Lugha-Llama 8B,afrimmlu,1.0,31.8,24.6,24.8,23.8,24.8,26.4,24.6,23.2,26.2,25.4,27.8,26.6,23.6,25.6,25.2,
37
- Lugha-Llama 8B,afrimgsm,1.0,6.4,2.4,0.8,2.0,1.2,0.8,2.4,1.6,0.8,2.0,2.0,2.0,2.4,3.6,1.8,
38
- Lugha-Llama 8B,flores - en_xx,1.0,51.3,7.9,19.3,25.5,29.2,9.6,15.3,5.7,30.3,25.9,40.9,31.3,16.9,29.4,22.1,
39
- Gemini-2.5 Flash,afrixnli,,86.2,76.3,71.8,76.2,68.8,32.8,69.2,74.2,76.2,71.3,74.0,76.8,67.7,73.2,69.9,3.0
40
- Gemini-2.5 Flash,afrimgsm,,86.8,78.0,72.0,71.6,69.2,58.8,60.8,74.0,72.4,68.0,87.2,62.0,77.6,66.4,70.6,2.0
41
- Gemini-2.5 Flash,flores - en_xx,,67.8,41.5,50.1,42.8,50.4,46.4,41.0,43.0,46.7,48.4,60.6,50.9,28.2,54.4,46.5,3.0
42
- Gemini-2.5 Flash,afrimmlu,,83.6,74.4,60.6,62.4,62.2,70.0,71.2,72.6,69.4,61.4,56.6,73.8,72.0,73.8,67.7,1.0
43
- Gemini-2.5 Flash,injongointent,,89.1,92.8,95.0,91.4,80.5,86.7,85.5,82.8,92.3,76.9,95.0,89.8,89.8,83.8,87.9,4.0
44
- Gemini-2.5 Flash,sib,,90.2,87.7,86.8,85.3,85.8,90.2,85.8,87.3,85.3,87.3,89.2,88.7,86.8,87.7,87.2,3.0
45
- Gemini-2.5 Flash,belebele,,74.1,47.9,33.7,28.3,44.1,41.7,37.4,38.1,49.2,42.6,53.6,48.6,36.3,46.6,42.2,5.0
46
- Claude 4.0 Sonnet,afrixnli,,90.2,80.3,72.3,74.0,66.3,32.0,62.7,68.3,70.8,71.2,73.5,74.8,67.2,71.3,68.1,1.0
47
- Claude 4.0 Sonnet,afrimgsm,,94.0,76.4,68.8,63.6,63.2,58.8,55.6,64.8,68.0,66.8,86.0,59.6,71.2,67.2,66.9,4.0
48
- Claude 4.0 Sonnet,flores - en_xx,,69.8,41.1,51.1,43.5,47.8,47.6,41.0,41.2,44.9,48.8,60.0,51.6,27.6,52.4,46.0,3.0
49
- Claude 4.0 Sonnet,afrimmlu,,90.0,83.2,74.4,80.8,73.2,73.6,63.2,72.6,74.0,75.6,84.8,79.6,72.6,74.2,75.5,1.0
50
- Claude 4.0 Sonnet,injongointent,,89.7,90.6,88.3,84.7,69.1,77.0,74.5,67.8,84.8,68.0,92.5,87.0,81.6,78.8,80.4,4.0
51
- Claude 4.0 Sonnet,sib,,88.2,88.7,84.8,83.8,85.3,81.4,76.0,76.0,78.9,83.3,87.7,84.8,86.3,84.8,83.2,5.0
52
- Claude 4.0 Sonnet,belebele,,94.7,86.0,77.9,72.4,77.9,70.2,64.4,68.4,77.8,77.9,89.6,81.9,68.3,78.1,76.2,5.0
53
- Claude 3.7 Sonnet,afrixnli,,83.2,69.3,60.5,60.8,60.0,35.0,58.5,62.2,61.5,63.8,63.7,63.7,55.5,63.3,59.8,1.0
54
- Claude 3.7 Sonnet,afrimgsm,,60.4,46.0,30.4,30.4,37.2,26.8,30.8,32.8,30.8,36.0,53.2,32.0,38.4,33.2,35.2,4.0
55
- Claude 3.7 Sonnet,flores - en_xx,,69.9,37.6,45.6,39.1,46.8,45.4,40.4,38.9,40.9,50.9,60.5,47.9,27.7,50.3,44.0,3.0
56
- Claude 3.7 Sonnet,afrimmlu,,77.8,71.0,64.2,67.8,64.0,62.0,62.8,65.6,63.6,67.6,76.4,68.6,66.4,67.6,66.7,1.0
57
- Claude 3.7 Sonnet,injongointent,,84.1,82.0,79.2,72.3,66.4,65.3,71.4,59.8,76.4,64.2,88.8,82.2,73.8,71.9,73.4,4.0
58
- Claude 3.7 Sonnet,sib,,86.8,86.8,86.3,83.8,86.3,85.8,81.4,82.4,83.8,83.8,85.8,87.7,85.8,83.8,84.9,5.0
59
- Claude 3.7 Sonnet,belebele,,74.0,69.4,60.1,59.0,68.7,64.7,62.6,62.2,70.4,65.0,74.8,66.8,57.6,65.2,65.1,5.0
60
- Claude 4.5 Sonnet,afrixnli,,90.8,83.2,75.2,76.8,70.5,32.5,70.8,74.3,78.2,72.8,76.7,78.3,70.0,72.5,71.7,1.0
61
- Claude 4.5 Sonnet,afrimgsm,,96.4,80.8,73.2,72.8,71.2,65.2,63.6,74.8,68.4,73.6,91.6,68.4,77.6,69.6,73.1,4.0
62
- Claude 4.5 Sonnet,afrimmlu,,89.6,65.0,56.0,57.2,53.4,51.8,57.8,58.0,62.4,59.4,58.8,60.6,64.0,57.4,58.6,1.0
63
- Claude 4.5 Sonnet,injongointent,,88.3,90.6,89.2,83.8,70.8,78.6,75.9,71.9,86.1,70.3,93.6,87.3,83.4,79.8,81.6,4.0
64
- Claude 4.5 Sonnet,sib,,87.7,89.7,86.8,85.3,87.3,79.4,76.5,83.3,80.4,84.8,88.7,85.8,82.8,84.3,84.2,5.0
65
- Claude 4.5 Sonnet,belebele,,83.9,81.8,73.4,68.7,73.2,70.1,66.3,71.6,75.2,75.3,87.7,79.4,72.2,77.0,74.8,5.0
66
- Gemini 2.5 Pro,afrixnli,,90.0,79.8,76.3,79.2,72.3,32.2,73.2,78.2,78.2,74.0,76.5,78.5,72.0,75.3,72.7,3.0
67
- Gemini 2.5 Pro,afrimgsm,,89.2,80.8,74.8,75.2,74.4,62.8,63.2,82.8,77.6,72.8,88.4,66.8,77.6,69.6,74.4,2.0
68
- Gemini 2.5 Pro,flores - en_xx,,68.2,41.2,49.4,42.9,51.0,47.8,42.8,44.8,47.4,50.3,60.7,51.7,30.5,55.4,47.4,3.0
69
- Gemini 2.5 Pro,afrimmlu,,72.2,82.2,68.4,76.4,75.8,79.2,79.8,75.0,81.2,75.2,80.4,85.0,76.0,82.2,78.2,1.0
70
- Gemini 2.5 Pro,injongointent,,87.9,91.7,94.1,92.0,80.9,90.5,85.5,85.3,93.8,76.6,93.8,90.5,89.2,83.8,88.3,4.0
71
- Gemini 2.5 Pro,sib,,88.7,88.7,89.2,89.7,87.3,87.3,85.3,86.8,87.7,87.7,90.2,89.2,88.2,87.7,88.1,3.0
72
- Gemini 2.5 Pro,belebele,,78.1,85.6,56.1,62.2,80.9,78.9,75.4,74.1,84.4,73.7,87.8,86.3,68.8,83.0,76.7,5.0
 
 
1
+ model,task,prompt,eng,amh,hau,ibo,kin,lin,lug,orm,sna,sot,swa,xho,yor,zul,avg
2
+ Gemma 3 27b,injongointent,4.0,79.58,71.56,69.53,56.56,53.44,38.12,37.97,31.25,56.88,47.66,81.09,63.59,49.53,60.78,55.2
3
+ Gemma 3 27b,afrixnli,2.0,65.5,59.5,55.5,53.83,46.67,35.17,48.17,50.17,52.67,51.83,55.67,53.83,48.17,54.83,51.2
4
+ Gemma 3 27b,afrimmlu,1.0,74.2,52.6,45.2,47.0,44.6,36.8,34.0,34.2,45.2,44.8,60.2,44.8,40.2,47.0,44.4
5
+ Gemma 3 27b,afrimgsm,2.0,87.6,61.2,61.2,36.8,54.0,18.4,36.4,32.0,52.0,51.6,78.0,48.8,36.8,50.8,47.5
6
+ Gemma 3 27b,belebele,5.0,93.44,76.44,71.44,59.22,69.0,38.44,44.67,52.11,68.78,62.0,84.7,67.33,49.56,67.0,62.4
7
+ Gemma 3 27b,sib,3.0,87.25,83.33,80.4,81.86,82.84,59.8,67.16,58.33,76.47,72.55,72.06,77.45,71.08,80.88,74.2
8
+ Gemma 3 27b,flores - en_xx,,68.9,23.8,43.9,35.2,35.6,24.8,21.6,17.5,35.1,38.1,57.0,35.8,21.0,40.8,33.1
9
+ Gemini-2.0 Flash,injongointent,4.0,88.9,84.8,80.5,78.8,63.8,65.3,63.0,62.3,77.0,59.4,91.4,84.2,75.3,74.5,73.9
10
+ Gemini-2.0 Flash,sib,3.0,86.8,87.3,85.3,82.8,87.3,84.8,81.9,80.4,85.8,82.8,87.8,86.3,84.3,87.3,84.9
11
+ Gemini-2.0 Flash,afrixnli,3.0,87.0,74.2,72.0,68.7,62.5,32.2,67.5,70.0,71.5,68.7,74.0,71.8,63.2,68.3,66.5
12
+ Gemini-2.0 Flash,belebele,4.0,63.0,66.0,49.2,48.7,59.3,51.9,54.3,52.0,63.4,50.8,69.8,61.8,49.9,61.3,56.8
13
+ Gemini-2.0 Flash,afrimmlu,5.0,80.8,65.0,61.2,57.4,54.4,52.8,49.4,51.8,57.0,55.8,71.4,60.6,57.4,56.8,57.8
14
+ Gemini-2.0 Flash,afrimgsm,2.0,92.8,76.0,70.4,61.2,64.4,63.6,59.2,73.6,63.6,65.2,84.0,60.8,70.8,65.2,67.5
15
+ Gemini-2.0 Flash,flores - en_xx,2.0,71.5,66.0,60.9,57.8,59.2,51.7,52.2,54.7,54.8,63.6,70.3,62.4,50.5,64.2,59.1
16
+ Gemini-2.0 Flash,flores - xx_en,2.0,73.1,40.9,54.3,45.2,53.0,51.5,44.0,44.2,50.2,52.0,65.2,54.3,31.6,58.4,49.6
17
+ GPT-4.1 (April),injongointent,1.0,87.8,86.6,93.3,86.6,77.2,82.8,81.3,73.8,90.2,75.0,93.9,89.5,85.6,81.9,84.4
18
+ GPT-4.1 (April),sib,1.0,89.7,85.8,84.8,85.8,87.3,84.3,82.4,84.3,86.3,86.3,81.4,87.7,80.4,85.8,84.8
19
+ GPT-4.1 (April),afrixnli,1.0,88.5,70.8,72.7,69.0,69.3,32.0,67.0,68.0,73.7,71.5,72.8,74.0,67.2,69.8,67.5
20
+ GPT-4.1 (April),belebele,1.0,73.9,72.0,48.0,37.7,76.4,61.7,54.0,58.3,77.6,60.8,90.0,78.0,52.2,76.1,64.8
21
+ GPT-4.1 (April),afrimmlu,1.0,71.4,55.2,55.4,56.2,63.8,60.2,50.2,53.0,65.2,57.0,76.8,66.6,53.6,69.8,60.2
22
+ GPT-4.1 (April),afrimgsm,1.0,82.4,57.2,57.2,54.0,60.4,49.6,54.4,64.4,60.0,64.4,77.2,51.2,65.2,58.0,59.5
23
+ GPT-4.1 (April),flores - en_xx,1.0,73.1,32.5,53.1,42.0,53.2,48.7,41.3,41.6,49.6,50.6,65.5,53.6,27.5,55.7,47.3
24
+ LLaMa 4 405B,injongointent,4.0,88.9,84.8,80.5,78.8,63.8,65.3,63.0,62.3,77.0,59.4,91.4,84.2,75.3,74.5,73.9
25
+ LLaMa 4 405B,sib,3.0,84.8,86.8,80.9,82.4,74.5,84.3,79.4,71.6,77.5,77.9,86.8,84.8,78.9,81.9,80.6
26
+ LLaMa 4 405B,afrixnli,2.0,49.2,56.8,44.8,53.3,43.0,35.3,42.5,45.0,46.5,43.7,48.5,47.0,41.8,43.0,45.5
27
+ LLaMa 4 405B,belebele,5.0,25.0,24.78,24.11,24.44,24.67,25.22,24.78,24.22,24.67,25.22,24.56,24.78,23.89,24.33,24.6
28
+ LLaMa 4 405B,afrimmlu,1.0,11.2,18.4,16.2,18.0,14.2,10.8,14.8,16.0,15.2,16.0,15.6,16.4,16.8,17.0,15.8
29
+ LLaMa 4 405B,afrimgsm,4.0,97.6,83.2,68.8,64.4,60.0,52.0,46.8,58.8,67.2,65.2,89.2,61.2,64.8,64.0,65.0
30
+ LLaMa 4 405B,flores - en_xx,3.0,73.0,37.64,50.34,43.73,39.05,41.76,34.11,36.48,40.53,40.07,61.96,50.25,28.0,53.07,42.8
31
+ LLaMa 4 405B,flores - xx_en,3.0,71.55,62.57,56.47,53.5,54.28,43.12,44.89,46.96,50.36,56.32,67.83,58.03,44.82,60.64,53.8
32
+ Lugha-Llama 8B,injongointent,1.0,16.7,3.1,5.8,4.2,3.0,8.0,2.3,2.5,2.5,5.0,5.6,2.7,5.8,2.5,4.1
33
+ Lugha-Llama 8B,sib,1.0,43.6,43.6,32.4,30.9,41.7,24.5,34.8,42.2,29.4,30.4,42.6,27.0,43.1,21.1,34.1
34
+ Lugha-Llama 8B,afrixnli,1.0,46.8,37.0,37.3,37.2,35.5,33.3,34.2,36.2,35.8,35.8,39.7,37.2,38.7,38.7,36.7
35
+ Lugha-Llama 8B,belebele,1.0,22.4,23.1,22.9,22.9,23.2,22.9,23.7,22.1,23.2,22.7,23.4,22.8,22.9,23.1,23.0
36
+ Lugha-Llama 8B,afrimmlu,1.0,31.8,24.6,24.8,23.8,24.8,26.4,24.6,23.2,26.2,25.4,27.8,26.6,23.6,25.6,25.2
37
+ Lugha-Llama 8B,afrimgsm,1.0,6.4,2.4,0.8,2.0,1.2,0.8,2.4,1.6,0.8,2.0,2.0,2.0,2.4,3.6,1.8
38
+ Lugha-Llama 8B,flores - en_xx,1.0,51.3,7.9,19.3,25.5,29.2,9.6,15.3,5.7,30.3,25.9,40.9,31.3,16.9,29.4,22.1
39
+ Gemini-2.5 Pro,afrixnli,3.0,90.0,79.8,76.3,79.2,72.3,32.2,73.2,78.2,78.2,74.0,76.5,78.5,72.0,75.3,72.7
40
+ Gemini-2.5 Pro,afrimgsm,2.0,89.2,80.8,74.8,75.2,74.4,62.8,63.2,82.8,77.6,72.8,88.4,66.8,77.6,69.6,74.4
41
+ Gemini-2.5 Pro,flores - en_xx,3.0,68.2,41.2,49.4,42.9,51.0,47.8,42.8,44.8,47.4,50.3,60.7,51.7,30.5,55.4,47.4
42
+ Gemini-2.5 Pro,afrimmlu,1.0,72.2,82.2,68.4,76.4,75.8,79.2,79.8,75.0,81.2,75.2,80.4,85.0,76.0,82.2,78.2
43
+ Gemini-2.5 Pro,injongointent,4.0,87.9,91.7,94.1,92.0,80.9,90.5,85.5,85.3,93.8,76.6,93.8,90.5,89.2,83.8,88.3
44
+ Gemini-2.5 Pro,sib,3.0,88.7,88.7,89.2,89.7,87.3,87.3,85.3,86.8,87.7,87.7,90.2,89.2,88.2,87.7,88.1
45
+ Gemini-2.5 Pro,belebele,5.0,78.1,85.6,56.1,62.2,80.9,78.9,75.4,74.1,84.4,73.7,87.8,86.3,68.8,83.0,76.7
46
+ Gemini-2.5 Flash,afrixnli,3.0,86.2,76.3,71.8,76.2,68.8,32.8,69.2,74.2,76.2,71.3,74.0,76.8,67.7,73.2,69.9
47
+ Gemini-2.5 Flash,afrimgsm,2.0,86.8,78.0,72.0,71.6,69.2,58.8,60.8,74.0,72.4,68.0,87.2,62.0,77.6,66.4,70.6
48
+ Gemini-2.5 Flash,flores - en_xx,3.0,67.8,41.5,50.1,42.8,50.4,46.4,41.0,43.0,46.7,48.4,60.6,50.9,28.2,54.4,46.5
49
+ Gemini-2.5 Flash,afrimmlu,1.0,83.6,74.4,60.6,62.4,62.2,70.0,71.2,72.6,69.4,61.4,56.6,73.8,72.0,73.8,67.7
50
+ Gemini-2.5 Flash,injongointent,4.0,89.1,92.8,95.0,91.4,80.5,86.7,85.5,82.8,92.3,76.9,95.0,89.8,89.8,83.8,87.9
51
+ Gemini-2.5 Flash,sib,3.0,90.2,87.7,86.8,85.3,85.8,90.2,85.8,87.3,85.3,87.3,89.2,88.7,86.8,87.7,87.2
52
+ Gemini-2.5 Flash,belebele,5.0,74.1,47.9,33.7,28.3,44.1,41.7,37.4,38.1,49.2,42.6,53.6,48.6,36.3,46.6,42.2
53
+ Claude 4.5 Sonnet,afrixnli,1.0,90.8,83.2,75.2,76.8,70.5,32.5,70.8,74.3,78.2,72.8,76.7,78.3,70.0,72.5,71.7
54
+ Claude 4.5 Sonnet,afrimgsm,4.0,96.4,80.8,73.2,72.8,71.2,65.2,63.6,74.8,68.4,73.6,91.6,68.4,77.6,69.6,73.1
55
+ Claude 4.5 Sonnet,flores - en_xx,3.0,69.7,41.8,51.1,44.0,49.0,47.7,41.2,41.7,45.8,49.8,60.4,51.3,29.8,52.8,46.6
56
+ Claude 4.5 Sonnet,afrimmlu,1.0,89.6,65.0,56.0,57.2,53.4,51.8,57.8,58.0,62.4,59.4,58.8,60.6,64.0,57.4,58.6
57
+ Claude 4.5 Sonnet,injongointent,4.0,88.3,90.6,89.2,83.8,70.8,78.6,75.9,71.9,86.1,70.3,93.6,87.3,83.4,79.8,81.6
58
+ Claude 4.5 Sonnet,sib,5.0,87.7,89.7,86.8,85.3,87.3,79.4,76.5,83.3,80.4,84.8,88.7,85.8,82.8,84.3,84.2
59
+ Claude 4.5 Sonnet,belebele,5.0,83.9,81.8,73.4,68.7,73.2,70.1,66.3,71.6,75.2,75.3,87.7,79.4,72.2,77.0,74.8
60
+ Claude 3.7 Sonnet,afrixnli,1.0,83.2,69.3,60.5,60.8,60.0,35.0,58.5,62.2,61.5,63.8,63.7,63.7,55.5,63.3,59.8
61
+ Claude 3.7 Sonnet,afrimgsm,4.0,60.4,46.0,30.4,30.4,37.2,26.8,30.8,32.8,30.8,36.0,53.2,32.0,38.4,33.2,35.2
62
+ Claude 3.7 Sonnet,flores - en_xx,3.0,69.9,37.6,45.6,39.1,46.8,45.4,40.4,38.9,40.9,50.9,60.5,47.9,27.7,50.3,44.0
63
+ Claude 3.7 Sonnet,afrimmlu,1.0,77.8,71.0,64.2,67.8,64.0,62.0,62.8,65.6,63.6,67.6,76.4,68.6,66.4,67.6,66.7
64
+ Claude 3.7 Sonnet,injongointent,4.0,84.1,82.0,79.2,72.3,66.4,65.3,71.4,59.8,76.4,64.2,88.8,82.2,73.8,71.9,73.4
65
+ Claude 3.7 Sonnet,sib,5.0,86.8,86.8,86.3,83.8,86.3,85.8,81.4,82.4,83.8,83.8,85.8,87.7,85.8,83.8,84.9
66
+ Claude 3.7 Sonnet,belebele,5.0,74.0,69.4,60.1,59.0,68.7,64.7,62.6,62.2,70.4,65.0,74.8,66.8,57.6,65.2,65.1
67
+ Claude 4.0 Sonnet,afrixnli,1.0,90.2,80.3,72.3,74.0,66.3,32.0,62.7,68.3,70.8,71.2,73.5,74.8,67.2,71.3,68.1
68
+ Claude 4.0 Sonnet,afrimgsm,4.0,94.0,76.4,68.8,63.6,63.2,58.8,55.6,64.8,68.0,66.8,86.0,59.6,71.2,67.2,66.9
69
+ Claude 4.0 Sonnet,flores - en_xx,3.0,69.8,41.1,51.1,43.5,47.8,47.6,41.0,41.2,44.9,48.8,60.0,51.6,27.6,52.4,46.0
70
+ Claude 4.0 Sonnet,afrimmlu,1.0,90.0,83.2,74.4,80.8,73.2,73.6,63.2,72.6,74.0,75.6,84.8,79.6,72.6,74.2,75.5
71
+ Claude 4.0 Sonnet,injongointent,4.0,89.7,90.6,88.3,84.7,69.1,77.0,74.5,67.8,84.8,68.0,92.5,87.0,81.6,78.8,80.4
72
+ Claude 4.0 Sonnet,sib,5.0,88.2,88.7,84.8,83.8,85.3,81.4,76.0,76.0,78.9,83.3,87.7,84.8,86.3,84.8,83.2
73
+ Claude 4.0 Sonnet,belebele,5.0,94.7,86.0,77.9,72.4,77.9,70.2,64.4,68.4,77.8,77.9,89.6,81.9,68.3,78.1,76.2
data/leaderboard_json/afrobench_lite.json CHANGED
@@ -18,11 +18,11 @@
18
  "GPT-4.1 (April)": 67.5,
19
  "LLaMa 4 405B": 45.5,
20
  "Lugha-Llama 8B": 36.7,
 
21
  "Gemini-2.5 Flash": 69.9,
22
- "Claude 4.0 Sonnet": 68.1,
23
- "Claude 3.7 Sonnet": 59.8,
24
  "Claude 4.5 Sonnet": 71.7,
25
- "Gemini 2.5 Pro": 72.7
 
26
  }
27
  },
28
  "Intent": {
@@ -44,11 +44,11 @@
44
  "GPT-4.1 (April)": 84.4,
45
  "LLaMa 4 405B": 73.9,
46
  "Lugha-Llama 8B": 4.1,
 
47
  "Gemini-2.5 Flash": 87.9,
48
- "Claude 4.0 Sonnet": 80.4,
49
- "Claude 3.7 Sonnet": 73.4,
50
  "Claude 4.5 Sonnet": 81.6,
51
- "Gemini 2.5 Pro": 88.3
 
52
  }
53
  },
54
  "MT(en/fr-xx)": {
@@ -70,10 +70,11 @@
70
  "GPT-4.1 (April)": 47.3,
71
  "LLaMa 4 405B": 42.8,
72
  "Lugha-Llama 8B": 22.1,
 
73
  "Gemini-2.5 Flash": 46.5,
74
- "Claude 4.0 Sonnet": 46.0,
75
  "Claude 3.7 Sonnet": 44.0,
76
- "Gemini 2.5 Pro": 47.4
77
  }
78
  },
79
  "MMLU": {
@@ -95,11 +96,11 @@
95
  "GPT-4.1 (April)": 60.2,
96
  "LLaMa 4 405B": 15.8,
97
  "Lugha-Llama 8B": 25.2,
 
98
  "Gemini-2.5 Flash": 67.7,
99
- "Claude 4.0 Sonnet": 75.5,
100
- "Claude 3.7 Sonnet": 66.7,
101
  "Claude 4.5 Sonnet": 58.6,
102
- "Gemini 2.5 Pro": 78.2
 
103
  }
104
  },
105
  "Math": {
@@ -121,11 +122,11 @@
121
  "GPT-4.1 (April)": 59.5,
122
  "LLaMa 4 405B": 65.0,
123
  "Lugha-Llama 8B": 1.8,
 
124
  "Gemini-2.5 Flash": 70.6,
125
- "Claude 4.0 Sonnet": 66.9,
126
- "Claude 3.7 Sonnet": 35.2,
127
  "Claude 4.5 Sonnet": 73.1,
128
- "Gemini 2.5 Pro": 74.4
 
129
  }
130
  },
131
  "Topic": {
@@ -147,11 +148,11 @@
147
  "GPT-4.1 (April)": 84.8,
148
  "LLaMa 4 405B": 80.6,
149
  "Lugha-Llama 8B": 34.1,
 
150
  "Gemini-2.5 Flash": 87.2,
151
- "Claude 4.0 Sonnet": 83.2,
152
- "Claude 3.7 Sonnet": 84.9,
153
  "Claude 4.5 Sonnet": 84.2,
154
- "Gemini 2.5 Pro": 88.1
 
155
  }
156
  },
157
  "RC": {
@@ -173,11 +174,11 @@
173
  "GPT-4.1 (April)": 64.8,
174
  "LLaMa 4 405B": 24.6,
175
  "Lugha-Llama 8B": 23.0,
 
176
  "Gemini-2.5 Flash": 42.2,
177
- "Claude 4.0 Sonnet": 76.2,
178
- "Claude 3.7 Sonnet": 65.1,
179
  "Claude 4.5 Sonnet": 74.8,
180
- "Gemini 2.5 Pro": 76.7
 
181
  }
182
  }
183
  }
 
18
  "GPT-4.1 (April)": 67.5,
19
  "LLaMa 4 405B": 45.5,
20
  "Lugha-Llama 8B": 36.7,
21
+ "Gemini-2.5 Pro": 72.7,
22
  "Gemini-2.5 Flash": 69.9,
 
 
23
  "Claude 4.5 Sonnet": 71.7,
24
+ "Claude 3.7 Sonnet": 59.8,
25
+ "Claude 4.0 Sonnet": 68.1
26
  }
27
  },
28
  "Intent": {
 
44
  "GPT-4.1 (April)": 84.4,
45
  "LLaMa 4 405B": 73.9,
46
  "Lugha-Llama 8B": 4.1,
47
+ "Gemini-2.5 Pro": 88.3,
48
  "Gemini-2.5 Flash": 87.9,
 
 
49
  "Claude 4.5 Sonnet": 81.6,
50
+ "Claude 3.7 Sonnet": 73.4,
51
+ "Claude 4.0 Sonnet": 80.4
52
  }
53
  },
54
  "MT(en/fr-xx)": {
 
70
  "GPT-4.1 (April)": 47.3,
71
  "LLaMa 4 405B": 42.8,
72
  "Lugha-Llama 8B": 22.1,
73
+ "Gemini-2.5 Pro": 47.4,
74
  "Gemini-2.5 Flash": 46.5,
75
+ "Claude 4.5 Sonnet": 46.6,
76
  "Claude 3.7 Sonnet": 44.0,
77
+ "Claude 4.0 Sonnet": 46.0
78
  }
79
  },
80
  "MMLU": {
 
96
  "GPT-4.1 (April)": 60.2,
97
  "LLaMa 4 405B": 15.8,
98
  "Lugha-Llama 8B": 25.2,
99
+ "Gemini-2.5 Pro": 78.2,
100
  "Gemini-2.5 Flash": 67.7,
 
 
101
  "Claude 4.5 Sonnet": 58.6,
102
+ "Claude 3.7 Sonnet": 66.7,
103
+ "Claude 4.0 Sonnet": 75.5
104
  }
105
  },
106
  "Math": {
 
122
  "GPT-4.1 (April)": 59.5,
123
  "LLaMa 4 405B": 65.0,
124
  "Lugha-Llama 8B": 1.8,
125
+ "Gemini-2.5 Pro": 74.4,
126
  "Gemini-2.5 Flash": 70.6,
 
 
127
  "Claude 4.5 Sonnet": 73.1,
128
+ "Claude 3.7 Sonnet": 35.2,
129
+ "Claude 4.0 Sonnet": 66.9
130
  }
131
  },
132
  "Topic": {
 
148
  "GPT-4.1 (April)": 84.8,
149
  "LLaMa 4 405B": 80.6,
150
  "Lugha-Llama 8B": 34.1,
151
+ "Gemini-2.5 Pro": 88.1,
152
  "Gemini-2.5 Flash": 87.2,
 
 
153
  "Claude 4.5 Sonnet": 84.2,
154
+ "Claude 3.7 Sonnet": 84.9,
155
+ "Claude 4.0 Sonnet": 83.2
156
  }
157
  },
158
  "RC": {
 
174
  "GPT-4.1 (April)": 64.8,
175
  "LLaMa 4 405B": 24.6,
176
  "Lugha-Llama 8B": 23.0,
177
+ "Gemini-2.5 Pro": 76.7,
178
  "Gemini-2.5 Flash": 42.2,
 
 
179
  "Claude 4.5 Sonnet": 74.8,
180
+ "Claude 3.7 Sonnet": 65.1,
181
+ "Claude 4.0 Sonnet": 76.2
182
  }
183
  }
184
  }
data/leaderboard_json/lite_language_scores.json CHANGED
@@ -11,9 +11,9 @@
11
  "sot": 37.0,
12
  "swa": 53.3,
13
  "xho": 49.0,
 
14
  "yor": 42.0,
15
- "zul": 47.7,
16
- "wol": 29.2
17
  },
18
  "Gemma1.1 7b": {
19
  "amh": 19.0,
@@ -27,9 +27,9 @@
27
  "sot": 19.0,
28
  "swa": 35.0,
29
  "xho": 23.6,
 
30
  "yor": 22.3,
31
- "zul": 23.8,
32
- "wol": 22.7
33
  },
34
  "LLaMa2 7b": {
35
  "amh": 15.4,
@@ -43,9 +43,9 @@
43
  "sot": 12.5,
44
  "swa": 17.5,
45
  "xho": 15.8,
 
46
  "yor": 16.0,
47
- "zul": 15.7,
48
- "wol": 16.7
49
  },
50
  "LLaMa3 8B": {
51
  "amh": 15.9,
@@ -59,9 +59,9 @@
59
  "sot": 16.1,
60
  "swa": 20.3,
61
  "xho": 16.2,
 
62
  "yor": 16.5,
63
- "zul": 17.1,
64
- "wol": 16.0
65
  },
66
  "LLaMa3.1 8B": {
67
  "amh": 18.9,
@@ -75,9 +75,9 @@
75
  "sot": 13.5,
76
  "swa": 29.5,
77
  "xho": 18.1,
 
78
  "yor": 19.1,
79
- "zul": 18.9,
80
- "wol": 17.2
81
  },
82
  "LLaMAX3 8B": {
83
  "amh": 18.8,
@@ -91,9 +91,9 @@
91
  "sot": 13.7,
92
  "swa": 21.2,
93
  "xho": 19.2,
 
94
  "yor": 18.6,
95
- "zul": 19.1,
96
- "wol": 16.6
97
  },
98
  "Gemma2 9b": {
99
  "amh": 45.0,
@@ -107,9 +107,9 @@
107
  "sot": 26.9,
108
  "swa": 61.1,
109
  "xho": 39.9,
 
110
  "yor": 33.2,
111
- "zul": 38.8,
112
- "wol": 26.2
113
  },
114
  "Gemma2 27b": {
115
  "amh": 45.3,
@@ -123,9 +123,9 @@
123
  "sot": 32.9,
124
  "swa": 67.7,
125
  "xho": 44.6,
 
126
  "yor": 37.6,
127
- "zul": 45.2,
128
- "wol": 26.9
129
  },
130
  "LLaMa3.1 70B": {
131
  "amh": 33.9,
@@ -139,9 +139,9 @@
139
  "sot": 26.0,
140
  "swa": 57.0,
141
  "xho": 29.5,
 
142
  "yor": 29.4,
143
- "zul": 32.1,
144
- "wol": 25.1
145
  },
146
  "AfroLLaMa 8B": {
147
  "amh": 14.1,
@@ -155,9 +155,9 @@
155
  "sot": 10.9,
156
  "swa": 16.2,
157
  "xho": 15.1,
 
158
  "yor": 16.2,
159
- "zul": 15.5,
160
- "wol": 14.2
161
  },
162
  "Gemini 1.5 pro": {
163
  "amh": 75.3,
@@ -171,9 +171,9 @@
171
  "sot": 64.3,
172
  "swa": 70.9,
173
  "xho": 69.2,
 
174
  "yor": 62.3,
175
- "zul": 66.8,
176
- "wol": 29.7
177
  },
178
  "GPT-4o (Aug)": {
179
  "amh": 67.7,
@@ -187,9 +187,9 @@
187
  "sot": 67.6,
188
  "swa": 73.6,
189
  "xho": 70.8,
 
190
  "yor": 68.3,
191
- "zul": 69.3,
192
- "wol": 43.5
193
  },
194
  "Gemma 3 27b": {
195
  "amh": 61.2,
@@ -266,6 +266,21 @@
266
  "yor": 21.9,
267
  "zul": 20.6
268
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
269
  "Gemini-2.5 Flash": {
270
  "amh": 71.2,
271
  "hau": 67.1,
@@ -281,20 +296,20 @@
281
  "yor": 65.5,
282
  "zul": 69.4
283
  },
284
- "Claude 4.0 Sonnet": {
285
- "amh": 78.0,
286
- "hau": 73.9,
287
- "ibo": 71.8,
288
- "kin": 69.0,
289
- "lin": 62.9,
290
- "lug": 62.5,
291
- "orm": 65.6,
292
- "sna": 71.3,
293
- "sot": 70.2,
294
- "swa": 82.0,
295
- "xho": 74.2,
296
- "yor": 67.8,
297
- "zul": 72.4
298
  },
299
  "Claude 3.7 Sonnet": {
300
  "amh": 66.0,
@@ -311,34 +326,19 @@
311
  "yor": 57.9,
312
  "zul": 62.2
313
  },
314
- "Claude 4.5 Sonnet": {
315
- "amh": 81.9,
316
- "hau": 75.6,
317
- "ibo": 74.1,
318
- "kin": 71.1,
319
  "lin": 62.9,
320
- "lug": 68.5,
321
- "orm": 72.3,
322
- "sna": 75.1,
323
- "sot": 72.7,
324
- "swa": 82.9,
325
- "xho": 76.6,
326
- "yor": 75.0,
327
- "zul": 73.4
328
- },
329
- "Gemini 2.5 Pro": {
330
- "amh": 78.6,
331
- "hau": 72.6,
332
- "ibo": 73.9,
333
- "kin": 74.7,
334
- "lin": 68.4,
335
- "lug": 72.2,
336
- "orm": 75.3,
337
- "sna": 78.6,
338
- "sot": 72.9,
339
- "swa": 82.5,
340
- "xho": 78.3,
341
- "yor": 71.8,
342
- "zul": 76.7
343
  }
344
  }
 
11
  "sot": 37.0,
12
  "swa": 53.3,
13
  "xho": 49.0,
14
+ "wol": 29.2,
15
  "yor": 42.0,
16
+ "zul": 47.7
 
17
  },
18
  "Gemma1.1 7b": {
19
  "amh": 19.0,
 
27
  "sot": 19.0,
28
  "swa": 35.0,
29
  "xho": 23.6,
30
+ "wol": 22.7,
31
  "yor": 22.3,
32
+ "zul": 23.8
 
33
  },
34
  "LLaMa2 7b": {
35
  "amh": 15.4,
 
43
  "sot": 12.5,
44
  "swa": 17.5,
45
  "xho": 15.8,
46
+ "wol": 16.7,
47
  "yor": 16.0,
48
+ "zul": 15.7
 
49
  },
50
  "LLaMa3 8B": {
51
  "amh": 15.9,
 
59
  "sot": 16.1,
60
  "swa": 20.3,
61
  "xho": 16.2,
62
+ "wol": 16.0,
63
  "yor": 16.5,
64
+ "zul": 17.1
 
65
  },
66
  "LLaMa3.1 8B": {
67
  "amh": 18.9,
 
75
  "sot": 13.5,
76
  "swa": 29.5,
77
  "xho": 18.1,
78
+ "wol": 17.2,
79
  "yor": 19.1,
80
+ "zul": 18.9
 
81
  },
82
  "LLaMAX3 8B": {
83
  "amh": 18.8,
 
91
  "sot": 13.7,
92
  "swa": 21.2,
93
  "xho": 19.2,
94
+ "wol": 16.6,
95
  "yor": 18.6,
96
+ "zul": 19.1
 
97
  },
98
  "Gemma2 9b": {
99
  "amh": 45.0,
 
107
  "sot": 26.9,
108
  "swa": 61.1,
109
  "xho": 39.9,
110
+ "wol": 26.2,
111
  "yor": 33.2,
112
+ "zul": 38.8
 
113
  },
114
  "Gemma2 27b": {
115
  "amh": 45.3,
 
123
  "sot": 32.9,
124
  "swa": 67.7,
125
  "xho": 44.6,
126
+ "wol": 26.9,
127
  "yor": 37.6,
128
+ "zul": 45.2
 
129
  },
130
  "LLaMa3.1 70B": {
131
  "amh": 33.9,
 
139
  "sot": 26.0,
140
  "swa": 57.0,
141
  "xho": 29.5,
142
+ "wol": 25.1,
143
  "yor": 29.4,
144
+ "zul": 32.1
 
145
  },
146
  "AfroLLaMa 8B": {
147
  "amh": 14.1,
 
155
  "sot": 10.9,
156
  "swa": 16.2,
157
  "xho": 15.1,
158
+ "wol": 14.2,
159
  "yor": 16.2,
160
+ "zul": 15.5
 
161
  },
162
  "Gemini 1.5 pro": {
163
  "amh": 75.3,
 
171
  "sot": 64.3,
172
  "swa": 70.9,
173
  "xho": 69.2,
174
+ "wol": 29.7,
175
  "yor": 62.3,
176
+ "zul": 66.8
 
177
  },
178
  "GPT-4o (Aug)": {
179
  "amh": 67.7,
 
187
  "sot": 67.6,
188
  "swa": 73.6,
189
  "xho": 70.8,
190
+ "wol": 43.5,
191
  "yor": 68.3,
192
+ "zul": 69.3
 
193
  },
194
  "Gemma 3 27b": {
195
  "amh": 61.2,
 
266
  "yor": 21.9,
267
  "zul": 20.6
268
  },
269
+ "Gemini-2.5 Pro": {
270
+ "amh": 78.6,
271
+ "hau": 72.6,
272
+ "ibo": 73.9,
273
+ "kin": 74.7,
274
+ "lin": 68.4,
275
+ "lug": 72.2,
276
+ "orm": 75.3,
277
+ "sna": 78.6,
278
+ "sot": 72.9,
279
+ "swa": 82.5,
280
+ "xho": 78.3,
281
+ "yor": 71.8,
282
+ "zul": 76.7
283
+ },
284
  "Gemini-2.5 Flash": {
285
  "amh": 71.2,
286
  "hau": 67.1,
 
296
  "yor": 65.5,
297
  "zul": 69.4
298
  },
299
+ "Claude 4.5 Sonnet": {
300
+ "amh": 76.1,
301
+ "hau": 72.1,
302
+ "ibo": 69.8,
303
+ "kin": 67.9,
304
+ "lin": 60.8,
305
+ "lug": 64.6,
306
+ "orm": 67.9,
307
+ "sna": 70.9,
308
+ "sot": 69.4,
309
+ "swa": 79.6,
310
+ "xho": 73.0,
311
+ "yor": 68.5,
312
+ "zul": 70.5
313
  },
314
  "Claude 3.7 Sonnet": {
315
  "amh": 66.0,
 
326
  "yor": 57.9,
327
  "zul": 62.2
328
  },
329
+ "Claude 4.0 Sonnet": {
330
+ "amh": 78.0,
331
+ "hau": 73.9,
332
+ "ibo": 71.8,
333
+ "kin": 69.0,
334
  "lin": 62.9,
335
+ "lug": 62.5,
336
+ "orm": 65.6,
337
+ "sna": 71.3,
338
+ "sot": 70.2,
339
+ "swa": 82.0,
340
+ "xho": 74.2,
341
+ "yor": 67.8,
342
+ "zul": 72.4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
343
  }
344
  }