@inproceedings{faruqui-das-2018-identifying,
title = "Identifying Well-formed Natural Language Questions",
author = "Faruqui, Manaal and
Das, Dipanjan",
editor = "Riloff, Ellen and
Chiang, David and
Hockenmaier, Julia and
Tsujii, Jun{'}ichi",
booktitle = "Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing",
month = oct # "-" # nov,
year = "2018",
address = "Brussels, Belgium",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/Author-page-Marten-During-lu/D18-1091/",
doi = "10.18653/v1/D18-1091",
pages = "798--803",
abstract = "Understanding search queries is a hard problem as it involves dealing with {\textquotedblleft}word salad{\textquotedblright} text ubiquitously issued by users. However, if a query resembles a well-formed question, a natural language processing pipeline is able to perform more accurate interpretation, thus reducing downstream compounding errors. Hence, identifying whether or not a query is well formed can enhance query understanding. Here, we introduce a new task of identifying a well-formed natural language question. We construct and release a dataset of 25,100 publicly available questions classified into well-formed and non-wellformed categories and report an accuracy of 70.7{\%} on the test set. We also show that our classifier can be used to improve the performance of neural sequence-to-sequence models for generating questions for reading comprehension."
}
Markdown (Informal)
[Identifying Well-formed Natural Language Questions](https://preview.aclanthology.org/Author-page-Marten-During-lu/D18-1091/) (Faruqui & Das, EMNLP 2018)
ACL
- Manaal Faruqui and Dipanjan Das. 2018. Identifying Well-formed Natural Language Questions. In Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing, pages 798–803, Brussels, Belgium. Association for Computational Linguistics.