@inproceedings{nursal-mitchell-2026-understanding,
title = "Understanding {LLM}s' summarization capabilities: an analysis of biomedical abstract and lay summary generation",
author = "Nursal, Batuhan and
Mitchell, Cassie S.",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Findings of the {A}ssociation for {C}omputational {L}inguistics: {ACL} 2026",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl-workshops/2026.findings-acl.554/",
pages = "11393--11417",
ISBN = "979-8-89176-395-1",
abstract = "Scientific abstracts and lay summaries serve distinct but critical roles in research communication. Abstracts use technical language for academic audiences, while lay summaries aim to make findings accessible to non-specialists. With the rise of large language models (LLMs), there is increasing interest in automating the generation of both types of summaries{---}especially in the biomedical domain, where clarity and factual accuracy are essential. This study evaluates the performance of lightweight LLMs (under 8B parameters) in generating biomedical abstracts and lay summaries in a zero-shot setting. We assess outputs across three key dimensions: relevance, readability, and factuality. Additionally, we introduce a novel analysis of the sectional origin and desirability of information{---}where desirability reflects the utility of content from the reader{'}s perspective. We further compare human and LLM preferences using an objective ranking task. Our results show that LLM-generated summaries often contain comparable levels of desirable information to gold-standard human references. In several cases, LLM outputs are preferred by human evaluators and occasionally mistaken for human-authored text. These findings demonstrate the potential of lightweight LLMs for scalable, high-quality summarization and suggest their practical use in domains requiring both technical and accessible communication. The codebase for this study is publicly available on GitHub: https://github.com/batuinmetz/Understanding-LLMs-summarization-capabilities"
}Markdown (Informal)
[Understanding LLMs’ summarization capabilities: an analysis of biomedical abstract and lay summary generation](https://preview.aclanthology.org/ingest-acl-workshops/2026.findings-acl.554/) (Nursal & Mitchell, Findings 2026)
ACL