@comment{Conference paper in the Proceedings of Machine Translation Summit X (2005).
  The day range of the conference is appended to the month macro.
  NOTE(review): the url field points at a preview.aclanthology.org build; confirm
  whether the canonical Anthology URL should be used instead.}
@inproceedings{zhang-etal-2005-building-annotated,
  title     = {Building an Annotated {Japanese}-{Chinese} Parallel Corpus {--} A Part of {NICT} Multilingual Corpora},
  author    = {Zhang, Yujie and Uchimoto, Kiyotaka and Ma, Qing and Isahara, Hitoshi},
  booktitle = {Proceedings of Machine Translation Summit X: Papers},
  month     = sep # " 13--15",
  year      = {2005},
  address   = {Phuket, Thailand},
  url       = {https://preview.aclanthology.org/jlcl-multiple-ingestion/2005.mtsummit-papers.10/},
  pages     = {71--78},
  abstract  = {We are constructing a Japanese-Chinese parallel corpus, which is a part of the NICT Multilingual Corpora. The corpus is general domain, of large scale of about 40,000 sentence pairs, long sentences, annotated with detailed information and high quality. To the best of our knowledge, this will be the first annotated Japanese-Chinese parallel corpus in the world. We created the corpus by selecting Japanese sentences from Mainichi Newspaper and then manually translating them into Chinese. We then annotated the corpus with morphological and syntactic structures and alignments at word and phrase levels. This paper describes the specification in human translation and detailed information annotation, and the tools we developed in the project. The experience we obtained and points we paid special attentions are also introduced for share with other researches in corpora construction.},
}
Markdown (Informal)
[Building an Annotated Japanese-Chinese Parallel Corpus – A Part of NICT Multilingual Corpora](https://preview.aclanthology.org/jlcl-multiple-ingestion/2005.mtsummit-papers.10/) (Zhang et al., MTSummit 2005)
ACL