\n \n \n
\n
\n \n 2025\n \n \n (1)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n AFRIDOC-MT: Document-level MT Corpus for African Languages.\n \n \n \n\n\n \n Alabi, J. O; Azime, I. A.; Zhang, M.; España-Bonet, C.; Bawden, R.; Zhu, D.; Adelani, D. I.; Odoje, C. O.; Akinade, I.; Maab, I.; and others\n\n\n \n\n\n\n
arXiv preprint arXiv:2501.06374. 2025.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{alabi2025afridoc,\n title={{AFRIDOC-MT}: Document-level {MT} Corpus for {African} Languages},\n author={Alabi, Jesujoba O and Azime, Israel Abebe and Zhang, Miaoran and Espa{\\~n}a-Bonet, Cristina and Bawden, Rachel and Zhu, Dawei and Adelani, David Ifeoluwa and Odoje, Clement Oyeleke and Akinade, Idris and Maab, Iffat and others},\n journal={arXiv preprint arXiv:2501.06374},\n year={2025}\n}\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2024\n \n \n (7)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n Walia-LLM: Enhancing Amharic-LLaMA by Integrating Task-Specific and Generative Datasets.\n \n \n \n\n\n \n Azime, I. A.; Fuge, M. Y.; Tonja, A. L.; Belay, T. D.; Wassie, A. K.; Jada, E. S.; Chanie, Y.; Sewunetie, W. T.; and Yimam, S. M.\n\n\n \n\n\n\n
arXiv preprint arXiv:2402.08015. 2024.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{azime2024walia,\n title={{Walia-LLM}: Enhancing {Amharic-LLaMA} by Integrating Task-Specific and Generative Datasets},\n author={Azime, Israel Abebe and Fuge, Mitiku Yohannes and Tonja, Atnafu Lambebo and Belay, Tadesse Destaw and Wassie, Aman Kassahun and Jada, Eyasu Shiferaw and Chanie, Yonas and Sewunetie, Walelign Tewabe and Yimam, Seid Muhie},\n journal={arXiv preprint arXiv:2402.08015},\n year={2024}\n}\n\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n EthioLLM: Multilingual Large Language Models for Ethiopian Languages with Task Evaluation.\n \n \n \n\n\n \n Tonja, A. L.; Azime, I. A.; Belay, T. D.; Yigezu, M. G.; Mehamed, M. A.; Ayele, A. A.; Jibril, E. C.; Woldeyohannis, M. M.; Kolesnikova, O.; Slusallek, P.; and others\n\n\n \n\n\n\n
arXiv preprint arXiv:2403.13737. 2024.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{tonja2024ethiollm,\n title={{EthioLLM}: Multilingual Large Language Models for {Ethiopian} Languages with Task Evaluation},\n author={Tonja, Atnafu Lambebo and Azime, Israel Abebe and Belay, Tadesse Destaw and Yigezu, Mesay Gemeda and Mehamed, Moges Ahmed and Ayele, Abinew Ali and Jibril, Ebrahim Chekol and Woldeyohannis, Michael Melese and Kolesnikova, Olga and Slusallek, Philipp and others},\n journal={arXiv preprint arXiv:2403.13737},\n year={2024}\n}\n\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n IrokoBench: A New Benchmark for African Languages in the Age of Large Language Models.\n \n \n \n\n\n \n Adelani, D. I.; Ojo, J.; Azime, I. A.; Zhuang, J. Y.; Alabi, J. O; He, X.; Ochieng, M.; Hooker, S.; Bukula, A.; Lee, E. A.; and others\n\n\n \n\n\n\n
arXiv preprint arXiv:2406.03368. 2024.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{adelani2024irokobench,\n title={{IrokoBench}: A New Benchmark for {African} Languages in the Age of Large Language Models},\n author={Adelani, David Ifeoluwa and Ojo, Jessica and Azime, Israel Abebe and Zhuang, Jian Yun and Alabi, Jesujoba O and He, Xuanli and Ochieng, Millicent and Hooker, Sara and Bukula, Andiswa and Lee, En-Shiun Annie and others},\n journal={arXiv preprint arXiv:2406.03368},\n year={2024}\n}\n\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n CVQA: Culturally-diverse Multilingual Visual Question Answering Benchmark.\n \n \n \n\n\n \n Romero, D.; Lyu, C.; Wibowo, H. A.; Lynn, T.; Hamed, I.; Kishore, A. N.; Mandal, A.; Dragonetti, A.; Abzaliev, A.; Tonja, A. L.; and others\n\n\n \n\n\n\n
arXiv preprint arXiv:2406.05967. 2024.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{romero2024cvqa,\n title={{CVQA}: Culturally-diverse Multilingual Visual Question Answering Benchmark},\n author={Romero, David and Lyu, Chenyang and Wibowo, Haryo Akbarianto and Lynn, Teresa and Hamed, Injy and Kishore, Aditya Nanda and Mandal, Aishik and Dragonetti, Alina and Abzaliev, Artem and Tonja, Atnafu Lambebo and others},\n journal={arXiv preprint arXiv:2406.05967},\n year={2024}\n}\n\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n ProverbEval: Exploring LLM Evaluation Challenges for Low-resource Language Understanding.\n \n \n \n\n\n \n Azime, I. A.; Tonja, A. L.; Belay, T. D.; Chanie, Y.; Balcha, B. F.; Abadi, N. H.; Ademtew, H. B.; Nerea, M. A.; Yadeta, D. D.; Geremew, D. D.; and others\n\n\n \n\n\n\n
arXiv preprint arXiv:2411.05049. 2024.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{azime2024proverbeval,\n title={{ProverbEval}: Exploring {LLM} Evaluation Challenges for Low-resource Language Understanding},\n author={Azime, Israel Abebe and Tonja, Atnafu Lambebo and Belay, Tadesse Destaw and Chanie, Yonas and Balcha, Bontu Fufa and Abadi, Negasi Haile and Ademtew, Henok Biadglign and Nerea, Mulubrhan Abebe and Yadeta, Debela Desalegn and Geremew, Derartu Dagne and others},\n journal={arXiv preprint arXiv:2411.05049},\n year={2024}\n}\n\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Uhura: A Benchmark for Evaluating Scientific Question Answering and Truthfulness in Low-Resource African Languages.\n \n \n \n\n\n \n Bayes, E.; Azime, I. A.; Alabi, J. O; Kgomo, J.; Eloundou, T.; Proehl, E.; Chen, K.; Khadir, I.; Etori, N. A; Muhammad, S. H.; and others\n\n\n \n\n\n\n
arXiv preprint arXiv:2412.00948. 2024.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{bayes2024uhura,\n title={{Uhura}: A Benchmark for Evaluating Scientific Question Answering and Truthfulness in Low-Resource {African} Languages},\n author={Bayes, Edward and Azime, Israel Abebe and Alabi, Jesujoba O and Kgomo, Jonas and Eloundou, Tyna and Proehl, Elizabeth and Chen, Kai and Khadir, Imaan and Etori, Naome A and Muhammad, Shamsuddeen Hassan and others},\n journal={arXiv preprint arXiv:2412.00948},\n year={2024}\n}\n\n
\n
\n\n\n\n
\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2023\n \n \n (3)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n Natural Language Processing in Ethiopian Languages: Current State, Challenges, and Opportunities.\n \n \n \n\n\n \n Tonja, A. L.; Belay, T. D.; Azime, I. A.; Ayele, A. A.; Mehamed, M. A.; Kolesnikova, O.; and Yimam, S. M.\n\n\n \n\n\n\n
arXiv preprint arXiv:2303.14406. 2023.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{tonja2023natural,\n title={Natural Language Processing in {Ethiopian} Languages: Current State, Challenges, and Opportunities},\n author={Tonja, Atnafu Lambebo and Belay, Tadesse Destaw and Azime, Israel Abebe and Ayele, Abinew Ali and Mehamed, Moges Ahmed and Kolesnikova, Olga and Yimam, Seid Muhie},\n journal={arXiv preprint arXiv:2303.14406},\n year={2023}\n}\n\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n Masakhane-Afrisenti at SemEval-2023 Task 12: Sentiment Analysis using Afro-centric Language Models and Adapters for Low-resource African Languages.\n \n \n \n\n\n \n Azime, I. A.; Al-Azzawi, S. S.; Tonja, A. L.; Shode, I.; Alabi, J.; Awokoya, A.; Oduwole, M.; Adewumi, T.; Fanijo, S.; Awosan, O.; and others\n\n\n \n\n\n\n
arXiv preprint arXiv:2304.06459. 2023.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{azime2023masakhane,\n title={{Masakhane-Afrisenti} at {SemEval-2023} Task 12: Sentiment Analysis using {Afro-centric} Language Models and Adapters for Low-resource {African} Languages},\n author={Azime, Israel Abebe and Al-Azzawi, Sana Sabah and Tonja, Atnafu Lambebo and Shode, Iyanuoluwa and Alabi, Jesujoba and Awokoya, Ayodele and Oduwole, Mardiyyah and Adewumi, Tosin and Fanijo, Samuel and Awosan, Oyinkansola and others},\n journal={arXiv preprint arXiv:2304.06459},\n year={2023}\n}\n\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n MasakhaNEWS: News Topic Classification for African Languages.\n \n \n \n\n\n \n Adelani, D. I.; Masiak, M.; Azime, I. A.; Alabi, J.; Tonja, A. L.; Mwase, C.; Ogundepo, O.; Dossou, B. F.; Oladipo, A.; Nixdorf, D.; and others\n\n\n \n\n\n\n
arXiv preprint arXiv:2304.09972. 2023.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{adelani2023masakhanews,\n title={{MasakhaNEWS}: News Topic Classification for {African} Languages},\n author={Adelani, David Ifeoluwa and Masiak, Marek and Azime, Israel Abebe and Alabi, Jesujoba and Tonja, Atnafu Lambebo and Mwase, Christine and Ogundepo, Odunayo and Dossou, Bonaventure F. P. and Oladipo, Akintunde and Nixdorf, Doreen and others},\n journal={arXiv preprint arXiv:2304.09972},\n year={2023}\n}\n\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2022\n \n \n (1)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n Quality at a glance: An audit of web-crawled multilingual datasets.\n \n \n \n\n\n \n Kreutzer, J.; Caswell, I.; Wang, L.; Wahab, A.; van Esch, D.; Ulzii-Orshikh, N.; Tapo, A.; Subramani, N.; Sokolov, A.; Sikasote, C.; and others\n\n\n \n\n\n\n
Transactions of the Association for Computational Linguistics, 10: 50–72. 2022.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{kreutzer2022quality,\n title={Quality at a Glance: An Audit of Web-Crawled Multilingual Datasets},\n author={Kreutzer, Julia and Caswell, Isaac and Wang, Lisa and Wahab, Ahsan and van Esch, Daan and Ulzii-Orshikh, Nasanbayar and Tapo, Allahsera and Subramani, Nishant and Sokolov, Artem and Sikasote, Claytone and others},\n journal={Transactions of the Association for Computational Linguistics},\n volume={10},\n pages={50--72},\n year={2022},\n publisher={MIT Press}\n}\n\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n 2021\n \n \n (2)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n An Amharic News Text Classification Dataset.\n \n \n \n\n\n \n Azime, I. A.; and Mohammed, N.\n\n\n \n\n\n\n
arXiv preprint arXiv:2103.05639. 2021.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{azime2021amharic,\n title={An {Amharic} News Text Classification Dataset},\n author={Azime, Israel Abebe and Mohammed, Nebil},\n journal={arXiv preprint arXiv:2103.05639},\n year={2021}\n}\n\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n MasakhaNER: Named entity recognition for African languages.\n \n \n \n\n\n \n Adelani, D. I.; Abbott, J.; Neubig, G.; D’souza, D.; Kreutzer, J.; Lignos, C.; Palen-Michel, C.; Buzaaba, H.; Rijhwani, S.; Ruder, S.; and others\n\n\n \n\n\n\n
Transactions of the Association for Computational Linguistics, 9: 1116–1131. 2021.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{adelani2021masakhaner,\n title={{MasakhaNER}: Named Entity Recognition for {African} Languages},\n author={Adelani, David Ifeoluwa and Abbott, Jade and Neubig, Graham and D'souza, Daniel and Kreutzer, Julia and Lignos, Constantine and Palen-Michel, Chester and Buzaaba, Happy and Rijhwani, Shruti and Ruder, Sebastian and others},\n journal={Transactions of the Association for Computational Linguistics},\n volume={9},\n pages={1116--1131},\n year={2021},\n publisher={MIT Press}\n}\n\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n
\n
\n \n undefined\n \n \n (3)\n \n \n
\n
\n \n \n
\n
\n\n \n \n \n \n \n 5th Workshop on African Natural Language Processing (AfricaNLP 2024).\n \n \n \n\n\n \n Buzaaba, H.; Dossou, B. F.; Adelani, D. I.; Elsahar, H.; Lignos, C.; Tonja, A. L.; Osei, S.; Aremu, A.; Siro, C.; Muhammad, S. H.; and others\n\n\n \n\n\n\n In
ICLR 2024 Workshops, 2024. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{buzaaba20245th,\n title={5th Workshop on {African} Natural Language Processing ({AfricaNLP} 2024)},\n author={Buzaaba, Happy and Dossou, Bonaventure F. P. and Adelani, David Ifeoluwa and Elsahar, Hady and Lignos, Constantine and Tonja, Atnafu Lambebo and Osei, Salomey and Aremu, Anuoluwapo and Siro, Clemencia and Muhammad, Shamsuddeen Hassan and others},\n booktitle={{ICLR} 2024 Workshops},\n year={2024}\n}\n\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n IrokoBench: A New Benchmark for African Languages in the Age of Large Language Models.\n \n \n \n\n\n \n Adelani, D. I.; Ojo, J.; Azime, I. A.; Zhuang, J. Y.; Alabi, J. O; He, X.; Ochieng, M.; Hooker, S.; Bukula, A.; Lee, E. A.; and others\n\n\n \n\n\n\n
arXiv preprint arXiv:2406.03368. 2024.\n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@article{adelaninkiruka,\n title={{IrokoBench}: A New Benchmark for {African} Languages in the Age of Large Language Models},\n author={Adelani, David Ifeoluwa and Ojo, Jessica and Azime, Israel Abebe and Zhuang, Jian Yun and Alabi, Jesujoba O and He, Xuanli and Ochieng, Millicent and Hooker, Sara and Bukula, Andiswa and Lee, En-Shiun Annie and others},\n journal={arXiv preprint arXiv:2406.03368},\n year={2024}\n}\n\n
\n
\n\n\n\n
\n\n\n
\n
\n\n \n \n \n \n \n CVQA: Culturally-diverse Multilingual Visual Question Answering Benchmark.\n \n \n \n\n\n \n Mogrovejo, D. O. R.; Lyu, C.; Wibowo, H. A.; Góngora, S.; Mandal, A.; Purkayastha, S.; Ortiz-Barajas, J.; Cueva, E. V.; Baek, J.; Jeong, S.; and others\n\n\n \n\n\n\n In
The Thirty-eighth Conference on Neural Information Processing Systems Datasets and Benchmarks Track, 2024. \n
\n\n
\n\n
\n\n
\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n
\n
@inproceedings{mogrovejocvqa,\n title={{CVQA}: Culturally-diverse Multilingual Visual Question Answering Benchmark},\n author={Mogrovejo, David Orlando Romero and Lyu, Chenyang and Wibowo, Haryo Akbarianto and G{\\'o}ngora, Santiago and Mandal, Aishik and Purkayastha, Sukannya and Ortiz-Barajas, Jesus-German and Cueva, Emilio Villa and Baek, Jinheon and Jeong, Soyeong and others},\n booktitle={The Thirty-eighth Conference on Neural Information Processing Systems Datasets and Benchmarks Track},\n year={2024}\n}\n\n
\n
\n\n\n\n
\n\n\n\n\n\n
\n
\n\n\n\n\n