@comment{
  Conference paper in the AMTA 2004 technical-papers proceedings.
  - month: built from the predefined month macros (sep, oct) joined with
    string pieces, so styles can still localise the month names; the day
    range uses an en dash (--).
  - url: canonical ACL Anthology record for 2004.amta-papers.20, not a
    temporary preview-branch link.
  - NOTE(review): address looks like the conference venue rather than the
    publisher's city; confirm against the target style before relying on it.
}
@inproceedings{lin-etal-2004-extraction,
    title     = {Extraction of name and transliteration in monolingual and parallel corpora},
    author    = {Lin, Tracy and
                 Wu, Jian-Cheng and
                 Chang, Jason S.},
    editor    = {Frederking, Robert E. and
                 Taylor, Kathryn B.},
    booktitle = {Proceedings of the 6th Conference of the Association for Machine Translation in the Americas: Technical Papers},
    month     = sep # " 28 -- " # oct # " 2",
    year      = {2004},
    address   = {Washington, USA},
    publisher = {Springer},
    url       = {https://aclanthology.org/2004.amta-papers.20/},
    pages     = {177--186},
    abstract  = {Named-entities in free text represent a challenge to text analysis in Machine Translation and Cross Language Information Retrieval. These phrases are often transliterated into another language with a different sound inventory and writing system. Named-entities found in free text are often not listed in bilingual dictionaries. Although it is possible to identify and translate named-entities on the fly without a list of proper names and transliterations, an extensive list of existing transliterations certainly will ensure high precision rate. We use a seed list of proper names and transliterations to train a Machine Transliteration Model. With the model it is possible to extract proper names and their transliterations in monolingual or parallel corpora with high precision and recall rates.},
}
Markdown (Informal)
[Extraction of name and transliteration in monolingual and parallel corpora](https://aclanthology.org/2004.amta-papers.20/) (Lin et al., AMTA 2004)
ACL