% Workshop paper from the AfricaNLP 2026 proceedings (ACL Anthology ID 2026.africanlp-main.29).
% NOTE(review): url was changed from the preview.aclanthology.org staging build to the
% canonical aclanthology.org address derived from the Anthology ID -- confirm it resolves.
@inproceedings{breiding-akbik-2026-using,
  title     = {Using Subword-Embeddings for Bilingual Lexicon Induction in {Bantu} Languages},
  author    = {Breiding, Adrian and
               Akbik, Alan},
  editor    = {Chimoto, Everlyn Asiko and
               Lignos, Constantine and
               Muhammad, Shamsuddeen and
               Abdulmumin, Idris and
               Siro, Clemencia and
               Adelani, David Ifeoluwa},
  booktitle = {Proceedings of the 7th Workshop on {African} Natural Language Processing ({AfricaNLP} 2026)},
  month     = mar,
  year      = {2026},
  address   = {Rabat, Morocco},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2026.africanlp-main.29/},
  pages     = {271--280},
  isbn      = {979-8-89176-364-7},
  abstract  = {Bilingual Lexicon Induction (BLI) is a valuable tool in machine translation and cross-lingual transfer learning, but it remains challenging for agglutinative and low-resource languages. In this work, we investigate the use of weighted sub-word embeddings in BLI for agglutinative languages. We further evaluate a graph-matching and Procrustes-based BLI approach on two Bantu languages, assessing its effectiveness in a previously underexplored language family. Our results for Swahili with an average P@1 score of 51.84{\%} for a 3000 word dictionary demonstrate the success of the approach for Bantu languages. Weighted sub-word embeddings perform competitively on Swahili and outperform word embeddings in our experiments with Zulu.},
}
Markdown (Informal)
[Using Subword-Embeddings for Bilingual Lexicon Induction in Bantu Languages](https://aclanthology.org/2026.africanlp-main.29/) (Breiding & Akbik, AfricaNLP 2026)
ACL