@inproceedings{lee-etal-2020-counselling,
title = "A Counselling Corpus in {C}antonese",
author = "Lee, John and
Cai, Tianyuan and
Xie, Wenxiu and
Xing, Lam",
editor = "Beermann, Dorothee and
Besacier, Laurent and
Sakti, Sakriani and
Soria, Claudia",
booktitle = "Proceedings of the 1st Joint Workshop on Spoken Language Technologies for Under-resourced languages (SLTU) and Collaboration and Computing for Under-Resourced Languages (CCURL)",
month = may,
year = "2020",
address = "Marseille, France",
publisher = "European Language Resources association",
url = "https://preview.aclanthology.org/Add-Cong-Liu-Florida-Atlantic-University-author-id/2020.sltu-1.50/",
pages = "358--361",
language = "eng",
ISBN = "979-10-95546-35-1",
abstract = "Virtual agents are increasingly used for delivering health information in general, and mental health assistance in particular. This paper presents a corpus designed for training a virtual counsellor in Cantonese, a variety of Chinese. The corpus consists of a domain-independent subcorpus that supports small talk for rapport building with users, and a domain-specific subcorpus that provides material for a particular area of counselling. The former consists of ELIZA style responses, chitchat expressions, and a dataset of general dialog, all of which are reusable across counselling domains. The latter consists of example user inputs and appropriate chatbot replies relevant to the specific domain. In a case study, we created a chatbot with a domain-specific subcorpus that addressed 25 issues in test anxiety, with 436 inputs solicited from native speakers of Cantonese and 150 chatbot replies harvested from mental health websites. Preliminary evaluations show that Word Mover`s Distance achieved 56{\%} accuracy in identifying the issue in user input, outperforming a number of baselines."
}
Markdown (Informal)
[A Counselling Corpus in Cantonese](https://preview.aclanthology.org/Add-Cong-Liu-Florida-Atlantic-University-author-id/2020.sltu-1.50/) (Lee et al., SLTU 2020)
ACL
- John Lee, Tianyuan Cai, Wenxiu Xie, and Lam Xing. 2020. A Counselling Corpus in Cantonese. In Proceedings of the 1st Joint Workshop on Spoken Language Technologies for Under-resourced languages (SLTU) and Collaboration and Computing for Under-Resourced Languages (CCURL), pages 358–361, Marseille, France. European Language Resources association.