@inproceedings{morris-etal-2025-using,
    title = "Using Whisper Embeddings for Audio-Only Latent Token Classification of Classroom Management Practices",
    author = "Morris, Wesley Griffith  and
      Vitale, Jessica  and
      Arvelo, Isabel",
    editor = "Wilson, Joshua  and
      Ormerod, Christopher  and
      Beiting Parrish, Magdalen",
    booktitle = "Proceedings of the Artificial Intelligence in Measurement and Education Conference (AIME-Con): Full Papers",
    month = oct,
    year = "2025",
    address = "Wyndham Grand Pittsburgh, Downtown, Pittsburgh, Pennsylvania, United States",
    publisher = "National Council on Measurement in Education (NCME)",
    url = "https://preview.aclanthology.org/ingest-emnlp/2025.aimecon-main.17/",
    pages = "154--162",
    ISBN = "979-8-218-84228-4",
    abstract = "In this study, we developed a textless NLP system using a fine-tuned Whisper encoder to identify classroom management practices from noisy classroom recordings. The model segments teacher speech from non-teacher speech and performs multi-label classification of classroom practices, achieving acceptable accuracy without requiring transcript generation."
}Markdown (Informal)
[Using Whisper Embeddings for Audio-Only Latent Token Classification of Classroom Management Practices](https://preview.aclanthology.org/ingest-emnlp/2025.aimecon-main.17/) (Morris et al., AIME-Con 2025)
ACL