@inproceedings{cettolo-etal-2008-shallow,
title = "Shallow-Syntax Phrase-Based Translation: Joint versus Factored String-to-Chunk Models",
author = "Cettolo, Mauro and
Federico, Marcello and
Pighin, Daniele and
Bertoldi, Nicola",
booktitle = "Proceedings of the 8th Conference of the Association for Machine Translation in the Americas: Research Papers",
month = oct # " 21-25",
year = "2008",
address = "Waikiki, USA",
publisher = "Association for Machine Translation in the Americas",
url = "https://aclanthology.org/2008.amta-papers.3",
pages = "56--64",
abstract = "This work extends phrase-based statistical MT (SMT) with shallow syntax dependencies. Two string-to-chunks translation models are proposed: a factored model, which augments phrase-based SMT with layered dependencies, and a joint model, that extends the phrase translation table with microtags, i.e. per-word projections of chunk labels. Both rely on n-gram models of target sequences with different granularity: single words, micro-tags, chunks. In particular, n-grams defined over syntactic chunks should model syntactic constraints coping with word-group movements. Experimental analysis and evaluation conducted on two popular Chinese-English tasks suggest that the shallow-syntax joint-translation model has potential to outperform state-of-the-art phrase-based translation, with a reasonable computational overhead.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="cettolo-etal-2008-shallow">
<titleInfo>
<title>Shallow-Syntax Phrase-Based Translation: Joint versus Factored String-to-Chunk Models</title>
</titleInfo>
<name type="personal">
<namePart type="given">Mauro</namePart>
<namePart type="family">Cettolo</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Marcello</namePart>
<namePart type="family">Federico</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Daniele</namePart>
<namePart type="family">Pighin</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Nicola</namePart>
<namePart type="family">Bertoldi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2008-oct" 21-25"</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 8th Conference of the Association for Machine Translation in the Americas: Research Papers</title>
</titleInfo>
<originInfo>
<publisher>Association for Machine Translation in the Americas</publisher>
<place>
<placeTerm type="text">Waikiki, USA</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>This work extends phrase-based statistical MT (SMT) with shallow syntax dependencies. Two string-to-chunks translation models are proposed: a factored model, which augments phrase-based SMT with layered dependencies, and a joint model, that extends the phrase translation table with microtags, i.e. per-word projections of chunk labels. Both rely on n-gram models of target sequences with different granularity: single words, micro-tags, chunks. In particular, n-grams defined over syntactic chunks should model syntactic constraints coping with word-group movements. Experimental analysis and evaluation conducted on two popular Chinese-English tasks suggest that the shallow-syntax joint-translation model has potential to outperform state-of-the-art phrase-based translation, with a reasonable computational overhead.</abstract>
<identifier type="citekey">cettolo-etal-2008-shallow</identifier>
<location>
<url>https://aclanthology.org/2008.amta-papers.3</url>
</location>
<part>
<date>2008-oct" 21-25"</date>
<extent unit="page">
<start>56</start>
<end>64</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T Shallow-Syntax Phrase-Based Translation: Joint versus Factored String-to-Chunk Models
%A Cettolo, Mauro
%A Federico, Marcello
%A Pighin, Daniele
%A Bertoldi, Nicola
%S Proceedings of the 8th Conference of the Association for Machine Translation in the Americas: Research Papers
%D 2008
%8 oct" 21 25"
%I Association for Machine Translation in the Americas
%C Waikiki, USA
%F cettolo-etal-2008-shallow
%X This work extends phrase-based statistical MT (SMT) with shallow syntax dependencies. Two string-to-chunks translation models are proposed: a factored model, which augments phrase-based SMT with layered dependencies, and a joint model, that extends the phrase translation table with microtags, i.e. per-word projections of chunk labels. Both rely on n-gram models of target sequences with different granularity: single words, micro-tags, chunks. In particular, n-grams defined over syntactic chunks should model syntactic constraints coping with word-group movements. Experimental analysis and evaluation conducted on two popular Chinese-English tasks suggest that the shallow-syntax joint-translation model has potential to outperform state-of-the-art phrase-based translation, with a reasonable computational overhead.
%U https://aclanthology.org/2008.amta-papers.3
%P 56-64
Markdown (Informal)
[Shallow-Syntax Phrase-Based Translation: Joint versus Factored String-to-Chunk Models](https://aclanthology.org/2008.amta-papers.3) (Cettolo et al., AMTA 2008)
ACL