% PROPOR 2026 paper: automatic classification of Brazilian university entrance exam questions by subject and topic.
@inproceedings{boccardo-feltrim-2026-automatic,
  title     = {Automatic Question classification in {Portuguese}: A Large-Scale Dataset and Comparative Evaluation of Classification Strategies},
  author    = {Boccardo, Murilo and
               Feltrim, Val{\'e}ria D.},
  editor    = {Souza, Marlo and
               de-Dios-Flores, Iria and
               Santos, Diana and
               Freitas, Larissa and
               Souza, Jackson Wilke da Cruz and
               Ribeiro, Eug{\'e}nio},
  booktitle = {Proceedings of the 17th International Conference on Computational Processing of {Portuguese} ({PROPOR} 2026) - Vol. 1},
  month     = apr,
  year      = {2026},
  address   = {Salvador, Brazil},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-dnd/2026.propor-1.43/},
  pages     = {436--445},
  isbn      = {979-8-89176-387-6},
  abstract  = {This paper presents a comparative evaluation of automatic classification strategies for Brazilian university entrance exam questions by subject and fine-grained topic. A central contribution of this study is the creation and curation of a large-scale Portuguese-language dataset comprising approximately 17,000 questions collected from the Agatha.edu platform, carefully cleaned and normalized. We investigated two alternative classification strategies: a single-step approach that directly predicts fine-grained topics and a two-stage approach in which an initial model predicts the subject, followed by specialized topic classifiers. These strategies were evaluated using both classical machine learning methods, such as Support Vector Machines, Naive Bayes, and Random Forest, and transformer-based language models pre-trained for Portuguese. Experimental results show the feasibility of large-scale automatic question classification and highlight the potential of NLP-based classification strategies to support the curation, analysis, and organization of educational question banks.},
}

Markdown (Informal)
[Automatic Question classification in Portuguese: A Large-Scale Dataset and Comparative Evaluation of Classification Strategies](https://preview.aclanthology.org/ingest-dnd/2026.propor-1.43/) (Boccardo & Feltrim, PROPOR 2026)
ACL