@inproceedings{habash-roth-2008-identification,
title = "Identification of Naturally Occurring Numerical Expressions in {A}rabic",
author = "Habash, Nizar and
Roth, Ryan",
booktitle = "Proceedings of the Sixth International Conference on Language Resources and Evaluation ({LREC}'08)",
month = may,
year = "2008",
address = "Marrakech, Morocco",
publisher = "European Language Resources Association (ELRA)",
url = "http://www.lrec-conf.org/proceedings/lrec2008/pdf/843_paper.pdf",
abstract = "In this paper, we define the task of Number Identification in natural context. We present and validate a language-independent semi-automatic approach to quickly building a gold standard for evaluating number identification systems by exploiting hand-aligned parallel data. We also present and extensively evaluate a robust rule-based system for number identification in natural context for Arabic for a variety of number formats and types. The system is shown to have strong performance, achieving, on a blind test, a 94.8{\%} F-score for the task of correctly identifying number expression spans in natural text, and a 92.1{\%} F-score for the task of correctly determining the core numerical value.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="habash-roth-2008-identification">
<titleInfo>
<title>Identification of Naturally Occurring Numerical Expressions in Arabic</title>
</titleInfo>
<name type="personal">
<namePart type="given">Nizar</namePart>
<namePart type="family">Habash</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Ryan</namePart>
<namePart type="family">Roth</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2008-may</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Sixth International Conference on Language Resources and Evaluation (LREC’08)</title>
</titleInfo>
<originInfo>
<publisher>European Language Resources Association (ELRA)</publisher>
<place>
<placeTerm type="text">Marrakech, Morocco</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>In this paper, we define the task of Number Identification in natural context. We present and validate a language-independent semi-automatic approach to quickly building a gold standard for evaluating number identification systems by exploiting hand-aligned parallel data. We also present and extensively evaluate a robust rule-based system for number identification in natural context for Arabic for a variety of number formats and types. The system is shown to have strong performance, achieving, on a blind test, a 94.8% F-score for the task of correctly identifying number expression spans in natural text, and a 92.1% F-score for the task of correctly determining the core numerical value.</abstract>
<identifier type="citekey">habash-roth-2008-identification</identifier>
<location>
<url>http://www.lrec-conf.org/proceedings/lrec2008/pdf/843_paper.pdf</url>
</location>
<part>
<date>2008-may</date>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Identification of Naturally Occurring Numerical Expressions in Arabic
%A Habash, Nizar
%A Roth, Ryan
%S Proceedings of the Sixth International Conference on Language Resources and Evaluation (LREC’08)
%D 2008
%8 may
%I European Language Resources Association (ELRA)
%C Marrakech, Morocco
%F habash-roth-2008-identification
%X In this paper, we define the task of Number Identification in natural context. We present and validate a language-independent semi-automatic approach to quickly building a gold standard for evaluating number identification systems by exploiting hand-aligned parallel data. We also present and extensively evaluate a robust rule-based system for number identification in natural context for Arabic for a variety of number formats and types. The system is shown to have strong performance, achieving, on a blind test, a 94.8% F-score for the task of correctly identifying number expression spans in natural text, and a 92.1% F-score for the task of correctly determining the core numerical value.
%U http://www.lrec-conf.org/proceedings/lrec2008/pdf/843_paper.pdf
Markdown (Informal)
[Identification of Naturally Occurring Numerical Expressions in Arabic](http://www.lrec-conf.org/proceedings/lrec2008/pdf/843_paper.pdf) (Habash & Roth, LREC 2008)
ACL