@inproceedings{colonel-lin-2025-word,
title = "Word Clouds as Common Voices: {LLM}-Assisted Visualization of Participant-Weighted Themes in Qualitative Interviews",
author = "Colonel, Joseph T and
Lin, Baihan",
editor = "Blodgett, Su Lin and
Curry, Amanda Cercas and
Dev, Sunipa and
Li, Siyan and
Madaio, Michael and
Wang, Jack and
Wu, Sherry Tongshuang and
Xiao, Ziang and
Yang, Diyi",
booktitle = "Proceedings of the Fourth Workshop on Bridging Human-Computer Interaction and Natural Language Processing (HCI+NLP)",
month = nov,
year = "2025",
address = "Suzhou, China",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-emnlp/2025.hcinlp-1.14/",
pages = "169--177",
ISBN = "979-8-89176-353-1",
abstract = "Word clouds are a common way to summarize qualitative interviews, yet traditional frequency-based methods often fail in conversational contexts: they surface filler words, ignore paraphrase, and fragment semantically related ideas. This limits their usefulness in early-stage analysis, when researchers need fast, interpretable overviews of what participant actually said. We introduce ThemeClouds, an open-source visualization tool that uses large language models (LLMs) to generate thematic, participant-weighted word clouds from dialogue transcripts. The system prompts an LLM to identify concept-level themes across a corpus and then counts how many unique participants mention each topic, yielding a visualization grounded in breadth of mention rather than raw term frequency. Researchers can customize prompts and visualization parameters, providing transparency and control. Using interviews from a user study comparing five recording-device configurations (31 participants; 155 transcripts, Whisper ASR), our approach surfaces more actionable device concerns than frequency clouds and topic-modeling baselines (e.g., LDA, BERTopic). We discuss design trade-offs for integrating LLM assistance into qualitative workflows, implications for interpretability and researcher agency, and opportunities for interactive analyses such as per-condition contrasts ({``}diff clouds'')."
}Markdown (Informal)
[Word Clouds as Common Voices: LLM-Assisted Visualization of Participant-Weighted Themes in Qualitative Interviews](https://preview.aclanthology.org/ingest-emnlp/2025.hcinlp-1.14/) (Colonel & Lin, HCINLP 2025)
ACL