{ "task": "NLU", "subtasks": { "Senti": { "datasets": { "afrisenti": { "languages": [ "amh", "arq", "ary", "hau", "ibo", "kin", "orm", "pcm", "por", "swa", "tir", "tso", "twi", "yor" ], "scores": { "AfroLLaMa 8B": [ 14.8, 28.8, 37.3, 45.5, 36.4, 43.0, 41.8, 41.3, 58.6, 54.8, 20.5, 24.0, 26.0, 41.9 ], "LLaMAX3 8B": [ 55.2, 55.5, 51.0, 61.7, 54.6, 53.2, 33.6, 56.0, 41.3, 54.1, 43.5, 48.0, 39.0, 50.4 ], "LLaMa2 7b": [ 25.5, 44.9, 44.0, 38.2, 33.6, 35.4, 24.7, 60.8, 31.2, 33.8, 33.4, 46.1, 48.9, 43.7 ], "LLaMa3.1 70B": [ 40.0, 47.5, 53.5, 52.6, 52.2, 48.5, 41.4, 52.6, 35.8, 61.5, 28.2, 43.3, 45.8, 54.3 ], "LLaMa3.1 8B": [ 66.4, 57.1, 51.9, 55.4, 50.1, 48.7, 35.9, 64.2, 33.6, 54.3, 49.8, 48.8, 42.3, 50.9 ], "LLaMa3 8B": [ 46.3, 51.0, 46.1, 38.5, 36.1, 38.4, 28.2, 60.2, 27.9, 37.8, 38.0, 43.3, 47.7, 45.0 ], "Aya-101 13B": [ 76.8, 67.8, 58.1, 61.2, 47.5, 61.1, 37.4, 70.0, 48.8, 47.5, 71.2, 50.8, 44.7, 57.0 ], "Gemma1.1 7b": [ 24.4, 43.1, 42.0, 37.9, 34.7, 32.0, 25.9, 66.5, 37.4, 37.0, 32.4, 50.0, 48.7, 43.8 ], "Gemma2 27b": [ 70.7, 65.8, 59.0, 64.8, 60.4, 59.1, 37.3, 76.0, 42.8, 55.6, 58.8, 50.0, 54.3, 65.4 ], "Gemma2 9b": [ 70.1, 62.0, 56.4, 61.4, 58.2, 56.1, 37.9, 66.8, 46.6, 58.7, 55.4, 43.7, 48.0, 55.4 ], "Gemini 1.5 pro": [ 77.5, 70.9, 63.7, 70.1, 56.9, 68.3, 42.8, 74.5, 46.4, 55.2, 70.2, 55.9, 49.3, 74.3 ], "GPT-4o (Aug)": [ 75.6, 72.3, 61.2, 68.6, 67.8, 71.6, 43.1, 67.1, 62.1, 57.9, 61.5, 46.5, 51.3, 70.2 ] } }, "nollysenti": { "languages": [ "hau", "ibo", "pcm", "yor" ], "scores": { "AfroLLaMa 8B": [ 83.2, 56.6, 82.6, 78.2 ], "LLaMAX3 8B": [ 61.8, 57.0, 68.2, 49.8 ], "LLaMa2 7b": [ 50.2, 50.0, 69.2, 50.0 ], "LLaMa3.1 8B": [ 64.8, 62.8, 86.4, 45.8 ], "LLaMa3.1 70B": [ 66.8, 75.0, 93.0, 54.2 ], "LLaMa3 8B": [ 52.8, 50.0, 63.2, 50.0 ], "Aya-101 13B": [ 90.6, 88.4, 92.4, 81.6 ], "Gemma1.1 7b": [ 52.0, 50.4, 89.2, 49.4 ], "Gemma2 27b": [ 87.4, 90.6, 92.6, 73.2 ], "Gemma2 9b": [ 77.0, 76.6, 93.6, 67.6 ], "Gemini 1.5 pro": [ 89.2, 89.2, 94.6, 80.4 ], "GPT-4o (Aug)": [ 91.6, 92.4, 95.4, 89.2 ] } } } }, "Topic": { "datasets": { "masakhanews": { "languages": [ "amh", "hau", "ibo", "lin", "lug", "orm", "pcm", "run", "sna", "som", "swa", "tir", "xho", "yor" ], "scores": { "AfroLLaMa 8B": [ 17.6, 60.1, 49.2, 65.7, 59.2, 40.3, 68.2, 56.2, 58.3, 46.3, 56.1, 9.9, 50.2, 69.1 ], "LLaMAX3 8B": [ 35.1, 47.6, 43.3, 75.4, 49.8, 40.0, 52.1, 42.2, 39.6, 37.1, 41.8, 42.3, 45.8, 44.5 ], "LLaMa2 7b": [ 14.9, 36.4, 26.2, 52.0, 45.3, 33.8, 60.0, 45.0, 37.4, 43.9, 25.4, 12.5, 20.5, 48.4 ], "LLaMa3.1 70B": [ 84.6, 79.6, 86.2, 79.4, 74.4, 72.6, 94.8, 87.9, 69.9, 72.1, 79.2, 71.0, 68.4, 89.8 ], "LLaMa3.1 8B": [ 52.4, 70.8, 74.1, 78.9, 58.3, 45.2, 87.2, 79.5, 56.4, 59.5, 75.2, 27.9, 44.8, 79.8 ], "LLaMa3 8B": [ 55.6, 60.0, 63.1, 66.9, 57.4, 59.7, 63.9, 66.8, 66.1, 58.8, 71.8, 38.6, 49.2, 61.6 ], "Aya-101 13B": [ 88.0, 81.6, 80.0, 83.4, 84.8, 88.9, 96.1, 92.6, 78.9, 74.5, 80.7, 82.0, 93.6, 94.2 ], "Gemma1.1 7b": [ 28.5, 71.1, 69.0, 79.4, 61.4, 75.4, 86.9, 86.3, 71.8, 68.4, 72.5, 34.2, 81.5, 84.4 ], "Gemma2 9b": [ 79.5, 80.7, 84.6, 85.1, 78.9, 81.2, 92.1, 89.1, 77.2, 75.2, 79.0, 73.9, 85.9, 85.6 ], "Gemma2 27b": [ 81.4, 80.4, 86.2, 82.3, 66.8, 74.2, 92.5, 89.8, 75.3, 76.5, 80.2, 69.1, 67.0, 89.3 ], "Gemini 1.5 pro": [ 89.4, 81.8, 86.7, 85.1, 79.8, 86.5, 95.4, 91.0, 76.4, 81.0, 80.7, 83.5, 81.8, 92.2 ], "GPT-4o (Aug)": [ 87.2, 82.9, 85.6, 85.1, 81.2, 88.3, 95.7, 91.3, 74.8, 81.0, 80.9, 84.6, 85.2, 92.7 ] } }, "sib": { "languages": [ "aeb", "afr", "aka", "amh", "ary", "arz", "bam", "bem", "cjk", "dik", "dyu", "ewe", "fon", "fuv", "gaz", "hau", "ibo", "kab", "kam", "kea", "kbp", "kik", "kin", "kmb", "knc", "kon", "lin", "lua", "lug", "luo", "mos", "nso", "nus", "nya", "plt", "por", "run", "sag", "sot", "sna", "som", "ssw", "swa", "tir", "tso", "tum", "twi", "tzm", "umb", "wol", "xho", "yor", "zul" ], "scores": { "AfroLLaMa 8B": [ 34.5, 6.4, 29.2, 6.4, 6.5, 6.4, 6.4, 41.7, 33.0, 28.5, 29.6, 6.5, 7.3, 37.0, 21.5, 6.4, 6.4, 21.0, 43.6, 52.7, 25.5, 41.4, 6.4, 37.6, 34.6, 46.8, 6.4, 37.1, 33.9, 34.2, 32.4, 38.6, 17.3, 41.2, 33.2, 65.6, 40.4, 41.0, 39.7, 6.4, 6.4, 57.3, 6.4, 6.4, 6.4, 39.5, 32.0, 10.6, 35.9, 42.2, 6.4, 7.4, 6.4 ], "LLaMAX3 8B": [ 68.3, 75.9, 48.1, 39.2, 70.3, 67.7, 29.6, 47.4, 35.9, 40.3, 36.0, 41.2, 31.3, 36.4, 38.5, 67.4, 68.6, 21.1, 44.6, 67.6, 33.6, 44.6, 69.5, 37.1, 40.4, 55.2, 59.5, 50.6, 52.4, 37.9, 36.4, 55.5, 27.0, 67.7, 70.6, 67.3, 65.4, 44.0, 58.8, 67.0, 63.0, 61.3, 75.5, 27.6, 53.7, 60.1, 49.3, 3.8, 32.6, 54.1, 71.7, 57.0, 73.6 ], "LLaMa2 7b": [ 41.0, 21.7, 21.7, 16.9, 41.4, 41.3, 14.3, 25.1, 21.1, 21.0, 19.6, 19.0, 14.0, 24.0, 12.7, 14.4, 23.2, 10.6, 20.9, 20.0, 14.2, 27.9, 18.4, 10.3, 16.6, 28.8, 24.1, 18.5, 22.0, 15.9, 11.6, 19.5, 14.6, 24.0, 22.0, 32.7, 11.7, 24.3, 14.3, 20.1, 11.5, 15.0, 17.7, 15.8, 14.9, 21.5, 27.8, 9.7, 14.7, 13.5, 16.3, 20.5, 13.3 ], "LLaMa3.1 70B": [ 86.0, 85.5, 50.5, 68.4, 87.2, 84.6, 36.3, 50.2, 31.7, 31.9, 39.3, 35.5, 30.0, 46.4, 30.7, 75.6, 68.9, 13.3, 37.9, 79.9, 46.1, 50.2, 74.1, 36.5, 40.0, 57.0, 58.3, 37.6, 58.5, 33.4, 32.4, 55.8, 27.8, 60.0, 44.0, 86.8, 59.8, 37.8, 54.4, 59.0, 63.4, 45.8, 85.2, 51.1, 49.7, 52.1, 59.5, 4.9, 31.1, 58.3, 65.0, 53.0, 57.3 ], "LLaMa3.1 8B": [ 75.3, 76.6, 46.2, 36.6, 78.0, 73.4, 37.4, 36.6, 39.5, 34.7, 36.0, 33.8, 34.0, 33.4, 39.8, 57.6, 44.0, 26.4, 28.1, 73.4, 36.8, 37.5, 49.0, 38.1, 40.1, 49.1, 47.2, 43.2, 39.1, 34.6, 34.4, 48.8, 25.7, 44.8, 47.3, 80.4, 41.9, 38.4, 47.9, 42.7, 49.1, 45.3, 66.2, 17.8, 42.7, 44.5, 49.9, 10.0, 36.8, 53.8, 45.4, 45.8, 48.9 ], "LLaMa3 8B": [ 63.9, 53.1, 39.5, 11.9, 67.3, 68.8, 33.5, 37.1, 30.3, 30.8, 30.4, 28.5, 21.6, 30.7, 21.5, 46.9, 43.3, 20.8, 33.2, 55.1, 22.8, 38.0, 45.7, 29.7, 31.6, 42.1, 44.8, 34.8, 34.2, 30.6, 34.6, 36.1, 24.5, 39.9, 18.5, 79.0, 42.4, 35.0, 38.8, 42.7, 44.2, 40.0, 66.3, 11.9, 32.8, 37.8, 38.8, 10.0, 30.2, 43.4, 33.4, 30.5, 40.0 ], "Aya-101 13B": [ 79.5, 83.0, 72.3, 79.7, 82.9, 83.6, 54.3, 67.1, 49.9, 45.4, 53.7, 54.2, 45.8, 50.8, 67.5, 82.8, 82.0, 35.8, 55.7, 81.3, 51.8, 61.3, 79.2, 55.4, 56.6, 66.3, 69.7, 56.7, 62.9, 57.7, 48.2, 80.2, 41.6, 81.5, 85.3, 83.6, 78.6, 57.9, 80.6, 82.4, 82.0, 76.7, 79.9, 79.0, 70.2, 74.1, 70.5, 26.5, 49.8, 58.3, 80.5, 76.5, 80.8 ], "Gemma1.1 7b": [ 71.7, 75.2, 42.3, 23.1, 71.9, 71.9, 37.7, 44.2, 37.4, 38.0, 45.0, 36.6, 27.6, 43.6, 33.3, 46.1, 48.8, 24.4, 43.1, 69.6, 34.7, 42.0, 38.7, 33.6, 44.6, 46.6, 43.5, 43.6, 38.7, 40.9, 38.3, 40.0, 29.1, 46.6, 49.4, 74.3, 35.5, 41.1, 44.6, 38.2, 39.5, 36.4, 57.0, 15.5, 38.6, 40.8, 41.0, 13.4, 31.0, 51.0, 50.6, 33.4, 41.2 ], "Gemma2 27b": [ 80.7, 82.6, 58.3, 75.0, 83.3, 83.4, 40.6, 60.7, 38.2, 37.5, 48.9, 40.7, 34.3, 47.1, 37.4, 71.7, 75.2, 27.8, 44.6, 81.9, 45.8, 56.2, 74.4, 43.5, 46.6, 56.4, 55.3, 43.4, 54.2, 39.7, 35.4, 65.6, 30.9, 64.7, 63.4, 83.4, 62.9, 43.7, 67.6, 72.6, 70.2, 55.5, 85.6, 61.7, 56.4, 65.1, 65.0, 10.5, 45.0, 56.9, 71.6, 62.2, 72.6 ], "Gemma2 9b": [ 79.3, 79.5, 55.3, 67.2, 79.2, 82.2, 38.3, 53.3, 45.6, 47.2, 47.1, 44.0, 32.4, 45.9, 41.9, 68.6, 70.2, 28.1, 45.5, 78.2, 43.9, 54.4, 68.3, 41.9, 39.2, 57.0, 52.9, 50.9, 55.7, 52.5, 39.4, 57.7, 28.6, 68.8, 60.2, 81.0, 58.1, 47.2, 65.1, 65.7, 67.3, 57.1, 79.6, 55.3, 57.6, 64.5, 61.6, 5.7, 42.1, 56.2, 67.3, 65.7, 71.3 ], "Gemini 1.5 pro": [ 87.2, 87.2, 80.4, 87.2, 87.8, 87.2, 60.3, 80.4, 56.9, 53.9, 60.3, 73.0, 60.8, 60.8, 81.4, 85.8, 81.9, 57.8, 63.7, 87.2, 68.1, 74.0, 84.3, 66.2, 51.0, 79.4, 87.8, 70.6, 78.9, 56.9, 52.0, 86.3, 46.1, 83.3, 85.3, 89.2, 81.4, 72.6, 86.3, 83.3, 86.8, 80.4, 59.8, 82.8, 81.4, 81.9, 82.4, 45.6, 61.3, 63.2, 86.3, 85.3, 86.8 ], "GPT-4o (Aug)": [ 87.2, 87.8, 76.5, 85.8, 88.7, 86.3, 57.8, 77.0, 54.4, 47.6, 59.8, 52.0, 45.6, 64.7, 85.8, 85.3, 83.3, 50.5, 73.0, 86.3, 47.6, 75.5, 84.8, 53.4, 57.4, 77.4, 86.3, 61.8, 81.4, 78.9, 43.6, 86.3, 46.1, 84.8, 77.4, 88.7, 85.3, 56.9, 83.8, 86.3, 85.8, 83.3, 58.3, 80.9, 85.8, 81.4, 77.9, 12.8, 59.3, 79.9, 87.8, 85.3, 87.8 ] } } } }, "NER": { "datasets": { "masakhaner": { "languages": [ "am", "bbj", "bm", "ee", "ha", "ig", "lg", "luo", "mos", "ny", "pcm", "rw", "sn", "sw", "tn", "tw", "wo", "xh", "yo", "zu" ], "scores": { "AfroLLaMa 8B": [ 0.0, 1.5, 1.3, 4.4, 5.7, 2.4, 6.0, 4.2, 0.8, 4.2, 4.1, 3.3, 2.7, 13.9, 2.9, 1.4, 1.3, 5.2, 2.1, 2.7 ], "LLaMAX3 8B": [ 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "LLaMa2 7b": [ 1.7, 13.1, 15.2, 26.8, 19.6, 18.5, 22.3, 19.9, 11.2, 18.5, 25.6, 13.2, 9.2, 24.8, 17.1, 11.5, 13.0, 7.2, 15.8, 6.8 ], "LLaMa3.1 70B": [ 1.7, 4.7, 8.3, 19.6, 24.6, 14.8, 21.9, 20.4, 8.3, 19.6, 19.6, 19.1, 9.0, 27.2, 18.6, 10.8, 13.9, 6.6, 12.5, 7.4 ], "LLaMa3.1 8B": [ 6.2, 6.0, 10.2, 11.2, 17.8, 10.9, 16.4, 11.7, 7.6, 17.7, 14.7, 15.0, 6.9, 22.3, 13.5, 8.1, 14.4, 5.0, 9.6, 5.0 ], "LLaMa3 8B": [ 1.6, 18.2, 20.8, 27.0, 33.4, 25.6, 32.2, 22.7, 15.1, 32.9, 25.8, 29.1, 15.4, 37.5, 24.6, 22.1, 22.2, 10.6, 22.7, 14.4 ], "Aya-101 13B": [ 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "Gemma1.1 7b": [ 1.2, 20.9, 23.0, 41.2, 29.8, 32.9, 37.3, 28.2, 17.7, 38.7, 38.0, 29.5, 22.8, 44.2, 36.7, 26.6, 24.3, 17.5, 26.7, 20.2 ], "Gemma2 27b": [ 30.4, 45.7, 46.1, 69.8, 58.0, 53.8, 64.8, 46.3, 47.4, 56.8, 61.7, 53.2, 30.5, 67.8, 64.4, 56.6, 51.9, 25.1, 53.1, 33.4 ], "Gemma2 9b": [ 17.3, 26.5, 30.9, 61.6, 51.6, 39.3, 55.0, 39.8, 30.1, 53.2, 52.8, 47.3, 28.7, 65.1, 50.0, 39.6, 38.7, 23.8, 29.8, 24.3 ], "Gemini 1.5 pro": [ 23.6, 28.0, 33.1, 69.9, 54.1, 42.4, 65.4, 39.2, 25.3, 56.7, 47.5, 45.0, 32.2, 66.8, 57.1, 22.8, 37.3, 25.6, 34.7, 28.8 ], "GPT-4o (Aug)": [ 18.3, 34.7, 30.8, 68.7, 50.9, 38.1, 63.5, 47.4, 26.1, 53.5, 42.5, 42.2, 34.7, 63.8, 56.3, 22.2, 36.0, 21.6, 32.5, 30.7 ] } } } }, "NLI": { "datasets": { "afrixnli": { "languages": [ "amh", "ewe", "hau", "ibo", "kin", "lin", "lug", "orm", "sna", "sot", "swa", "twi", "wol", "xho", "yor", "zul" ], "scores": { "Aya-101 13B": [ 64.2, 43.2, 57.0, 55.5, 54.3, 33.5, 51.7, 51.5, 55.7, 52.2, 56.5, 47.0, 36.7, 55.2, 54.5, 55.3 ], "Gemma1.1 7b": [ 33.8, 32.8, 35.2, 35.3, 33.8, 33.8, 33.7, 33.8, 34.2, 35.2, 40.7, 33.7, 33.3, 34.0, 33.7, 34.0 ], "LLaMa2 7b": [ 33.3, 34.7, 33.7, 33.5, 35.2, 33.2, 33.5, 34.3, 33.0, 34.0, 34.7, 34.2, 34.5, 35.5, 33.2, 30.3 ], "LLaMa3 8B": [ 40.2, 34.3, 35.6, 39.1, 32.9, 32.7, 33.3, 35.4, 35.5, 35.9, 34.1, 34.3, 33.3, 36.8, 35.2, 38.5 ], "LLaMa3.1 8B": [ 38.8, 37.7, 36.5, 38.5, 38.3, 32.3, 37.5, 35.0, 35.8, 34.8, 43.8, 37.0, 32.3, 33.8, 38.5, 34.0 ], "LLaMAX3 8B": [ 40.2, 35.8, 44.8, 42.5, 37.7, 29.8, 42.7, 40.5, 47.0, 39.7, 45.7, 36.3, 37.3, 46.2, 44.0, 42.0 ], "Gemma2 9b": [ 43.2, 35.3, 47.0, 40.7, 40.2, 32.8, 38.8, 37.8, 42.3, 40.2, 46.3, 37.2, 35.2, 42.5, 41.3, 44.5 ], "Gemma2 27b": [ 47.0, 36.8, 49.7, 46.2, 40.5, 32.0, 41.7, 35.8, 46.0, 43.5, 57.0, 36.0, 36.7, 45.0, 42.5, 48.0 ], "LLaMa3.1 70B": [ 43.2, 34.3, 42.8, 42.3, 36.5, 32.8, 37.5, 34.7, 35.5, 38.3, 44.0, 36.0, 34.7, 39.3, 39.0, 37.0 ], "AfroLLaMa 8B": [ 33.0, 32.7, 40.7, 35.8, 32.7, 33.5, 32.3, 34.2, 34.0, 33.3, 39.7, 33.0, 37.0, 41.8, 42.0, 38.3 ], "Gemini 1.5 pro": [ 75.3, 47.5, 73.3, 68.2, 64.8, 33.2, 64.8, 61.3, 73.7, 68.5, 68.3, 54.5, 42.3, 69.3, 61.8, 65.0 ], "GPT-4o (Aug)": [ 71.8, 45.0, 75.2, 68.2, 68.0, 32.7, 69.8, 71.2, 71.3, 71.8, 71.5, 55.8, 52.7, 72.0, 64.5, 67.5 ] } } } }, "Intent": { "datasets": { "injongointent": { "languages": [ "amh", "ewe", "hau", "ibo", "kin", "lin", "lug", "orm", "sna", "sot", "swa", "twi", "wol", "xho", "yor", "zul" ], "scores": { "AfroLLaMa 8B": [ 0.2, 0.1, 1.9, 0.3, 0.4, 0.4, 0.1, 0.1, 0.2, 0.1, 4.2, 0.1, 0.1, 1.8, 2.2, 1.0 ], "LLaMAX3 8B": [ 6.1, 0.7, 10.1, 10.9, 3.0, 3.5, 2.6, 2.7, 4.0, 3.8, 15.9, 1.5, 2.7, 8.2, 1.9, 12.3 ], "LLaMa2 7b": [ 0.4, 1.1, 1.1, 2.1, 0.5, 4.5, 1.5, 0.6, 1.7, 0.1, 1.7, 2.1, 3.5, 0.4, 0.3, 1.8 ], "LLaMa3.1 70B": [ 43.6, 8.3, 61.5, 53.7, 34.2, 34.9, 26.8, 12.1, 24.8, 23.1, 82.2, 19.0, 21.3, 32.1, 36.4, 30.5 ], "LLaMa3.1 8B": [ 4.4, 3.6, 7.3, 7.7, 4.0, 4.4, 3.4, 1.1, 3.4, 5.0, 26.9, 5.1, 4.0, 5.9, 4.7, 5.7 ], "LLaMa3 8B": [ 0.1, 1.3, 1.4, 4.1, 2.9, 4.6, 0.4, 0.1, 1.4, 2.4, 9.7, 0.1, 0.6, 1.9, 0.1, 2.5 ], "Gemma1.1 7b": [ 2.2, 2.1, 9.2, 12.1, 7.1, 19.8, 4.9, 3.5, 4.4, 11.6, 36.9, 6.8, 5.8, 8.2, 7.7, 8.9 ], "Gemma2 27b": [ 44.3, 47.2, 6.3, 46.5, 36.9, 26.7, 27.5, 26.1, 5.8, 36.7, 25.6, 75.5, 21.2, 16.4, 50.2, 34.8 ], "Gemma2 9b": [ 36.3, 49.2, 6.1, 40.8, 31.5, 23.8, 22.2, 23.2, 7.7, 29.7, 19.9, 70.0, 21.0, 13.8, 40.1, 32.2 ], "Aya-101 13B": [ 62.9, 13.4, 57.8, 56.9, 40.4, 27.8, 33.9, 20.8, 51.2, 43.9, 65.9, 27.2, 19.7, 58.1, 45.9, 53.2 ], "Gemini 1.5 pro": [ 86.2, 49.3, 87.0, 78.3, 75.2, 77.3, 77.8, 64.7, 83.6, 69.8, 88.9, 71.4, 37.8, 85.2, 80.3, 76.4 ], "GPT-4o (Aug)": [ 77.5, 21.1, 89.7, 79.4, 74.4, 76.2, 78.0, 69.5, 84.7, 70.6, 90.3, 66.7, 61.4, 85.2, 81.2, 78.1 ] } } } }, "Hate": { "datasets": { "afrihate": { "languages": [ "amh", "arq", "ary", "hau", "ibo", "kin", "orm", "pcm", "som", "swa", "tir", "twi", "xho", "yor", "zul" ], "scores": { "Gemma1.1 7b": [ 23.0, 27.4, 24.5, 26.0, 16.7, 29.9, 27.9, 30.2, 27.2, 27.4, 17.3, 14.2, 23.3, 25.0, 22.5 ], "LLaMa2 7b": [ 14.5, 22.4, 22.2, 24.4, 20.2, 22.4, 31.3, 9.4, 27.1, 24.8, 11.7, 15.8, 24.8, 23.1, 26.8 ], "LLaMa3 8B": [ 26.5, 31.8, 28.5, 24.5, 19.7, 36.5, 37.1, 38.8, 17.8, 34.3, 28.4, 14.4, 25.0, 25.9, 28.4 ], "LLaMAX3 8B": [ 37.2, 33.6, 31.5, 30.7, 19.4, 38.2, 38.2, 34.4, 27.6, 28.9, 27.4, 13.9, 23.7, 24.4, 29.0 ], "LLaMa3.1 8B": [ 23.3, 30.7, 22.9, 25.4, 13.9, 31.9, 35.7, 24.9, 26.7, 21.7, 21.9, 9.9, 22.4, 19.4, 23.3 ], "AfroLLaMa 8B": [ 14.3, 16.5, 17.8, 24.1, 12.4, 21.9, 19.4, 18.9, 24.4, 20.6, 11.7, 8.8, 21.2, 18.4, 21.6 ], "Gemma2 9b": [ 33.2, 33.8, 33.2, 24.1, 25.1, 33.6, 26.7, 54.9, 13.6, 46.4, 26.8, 29.1, 20.0, 30.5, 20.1 ], "Aya-101 13B": [ 39.3, 33.6, 29.9, 34.3, 20.9, 37.9, 34.8, 36.9, 38.3, 35.7, 36.8, 13.2, 26.4, 27.1, 28.7 ], "Gemma2 27b": [ 48.4, 49.1, 53.8, 34.8, 42.8, 52.7, 39.8, 60.9, 39.6, 70.9, 35.4, 38.1, 30.6, 54.0, 35.0 ], "LLaMa3.1 70B": [ 53.0, 57.0, 60.6, 41.2, 48.4, 50.9, 44.6, 62.4, 39.8, 67.0, 41.0, 37.9, 32.7, 56.2, 46.3 ], "Gemini 1.5 pro": [ 56.1, 70.6, 68.2, 61.4, 66.9, 64.2, 57.6, 65.0, 60.8, 80.5, 37.5, 50.6, 58.0, 73.1, 55.4 ], "GPT-4o (Aug)": [ 56.0, 69.7, 75.5, 59.2, 69.7, 60.1, 53.5, 65.2, 68.5, 78.0, 42.4, 51.2, 63.7, 74.5, 58.7 ] } } } }, "POS": { "datasets": { "masakhapos": { "languages": [ "bam", "bbj", "ewe", "fon", "hau", "ibo", "kin", "lug", "luo", "mos", "nya", "pcm", "sna", "swa", "tsn", "twi", "wol", "xho", "yor", "zul" ], "scores": { "AfroLLaMa 8B": [ 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "LLaMAX3 8B": [ 31.7, 25.4, 43.9, 25.8, 41.2, 40.4, 44.6, 45.2, 28.7, 37.7, 47.8, 54.2, 50.3, 48.9, 49.2, 37.4, 34.1, 52.4, 41.2, 50.9 ], "LLaMa2 7b": [ 27.3, 22.0, 34.8, 23.5, 25.5, 26.4, 25.0, 31.9, 22.6, 26.9, 31.8, 40.6, 30.7, 36.3, 24.8, 21.1, 19.1, 31.3, 25.7, 31.0 ], "LLaMa3.1 70B": [ 42.6, 27.2, 54.6, 37.0, 63.1, 54.2, 44.6, 49.6, 36.9, 43.7, 65.7, 78.6, 66.6, 65.2, 52.2, 51.0, 48.0, 68.6, 60.9, 71.6 ], "LLaMa3.1 8B": [ 34.2, 25.2, 46.0, 27.7, 57.6, 44.9, 39.4, 45.8, 32.8, 40.7, 55.3, 71.8, 57.7, 61.8, 49.4, 42.3, 37.6, 58.0, 48.9, 64.2 ], "LLaMa3 8B": [ 38.2, 25.0, 48.8, 33.5, 55.8, 45.0, 40.6, 44.0, 34.4, 41.6, 58.8, 76.0, 58.4, 61.4, 47.6, 44.9, 43.6, 56.7, 50.4, 65.2 ], "Aya-101 13B": [ 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 ], "Gemma1.1 7b": [ 34.9, 22.6, 39.2, 27.8, 37.9, 38.0, 39.1, 45.3, 27.2, 33.3, 38.3, 65.5, 42.8, 48.6, 40.3, 34.8, 28.8, 45.1, 37.2, 46.0 ], "Gemma2 27b": [ 38.4, 27.4, 52.0, 35.7, 61.3, 57.2, 45.4, 50.3, 37.9, 43.0, 67.2, 81.9, 72.7, 66.2, 58.5, 57.3, 48.7, 68.0, 61.8, 70.8 ], "Gemma2 9b": [ 39.2, 27.2, 50.8, 34.0, 58.0, 51.2, 47.4, 50.2, 34.9, 44.9, 60.8, 77.2, 68.0, 63.9, 51.9, 53.8, 41.7, 62.7, 54.8, 65.2 ], "Gemini 1.5 pro": [ 45.8, 30.1, 65.7, 56.0, 64.0, 55.1, 46.7, 51.0, 44.9, 54.7, 74.5, 85.0, 77.1, 66.5, 57.3, 61.9, 66.9, 70.2, 65.9, 76.0 ], "GPT-4o (Aug)": [ 47.8, 31.6, 67.7, 46.9, 64.9, 56.6, 47.2, 52.6, 58.7, 49.5, 74.7, 84.9, 79.6, 68.2, 60.2, 63.6, 83.0, 70.5, 70.4, 76.9 ] } } } } } }