% Conference paper record; appears to be an ACL Anthology export.
% NOTE(review): the url field was normalised from the temporary preview path
%   https://preview.aclanthology.org/ingest-acl/2026.acl-srw.44/
% to the canonical Anthology address; confirm it resolves once the volume is live.
% NOTE(review): address holds the conference location, as exported by the source.
% Case-protecting braces wrap whole words so kerning and hyphenation are unaffected.
@inproceedings{cieslak-czyzewski-2026-locality,
  author    = {Cie{\'s}lak, Daniel and
               Czy{\.z}ewski, Andrzej},
  title     = {Does Locality Cost in {Polish} Medical Text Classification? Duplicate-Aware Evaluation of Federated Learning},
  editor    = {T.Y.S.S., Santosh and
               Rodriguez, Juan Diego and
               de Gibert, Ona},
  booktitle = {Proceedings of the 64th Annual Meeting of the {Association} for {Computational} {Linguistics} ({ACL} 2026)},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  pages     = {498--508},
  isbn      = {979-8-89176-393-7},
  url       = {https://aclanthology.org/2026.acl-srw.44/},
  abstract  = {Federated learning is often framed as a practical trade-off in clinical NLP: safer data handling at the cost of lower predictive performance. We revisit this assumption in a benchmark-specific study of Polish medical text classification. A key issue is evaluation granularity: the test split contains 10,634 rows but only 670 unique normalized text hashes, with 18 inconsistent groups removed in strict grouped evaluation. We therefore compare centralized and federated training under both conventional instance-level scoring and a stricter hash-level protocol that controls duplicate inflation. In the strongest reported settings, federated training matches or slightly exceeds the centralized baseline, reaching instance-level Macro-F1 of 0.8826 {\ensuremath{\pm}} 0.0177 versus 0.8689 {\ensuremath{\pm}} 0.0124, and hash-level Macro-F1 of 0.8908 {\ensuremath{\pm}} 0.0220 versus 0.8841 {\ensuremath{\pm}} 0.0078. The claim is deliberately narrow: we do not argue that federated learning is generally superior to centralized training, nor do we claim formal privacy guarantees. Rather, we show that in this duplicate-heavy Polish medical text benchmark, conclusions about locality depend strongly on evaluation hygiene.},
}

% Markdown (Informal)
[Does Locality Cost in Polish Medical Text Classification? Duplicate-Aware Evaluation of Federated Learning](https://aclanthology.org/2026.acl-srw.44/) (Cieślak & Czyżewski, ACL 2026)
ACL