@inproceedings{khan-etal-2026-stoicllm,
title = "{S}toic{LLM}: Preference Optimization for Philosophical Alignment in Small Language Models",
author = "Khan, Ishmam and
Thogarrati, Sindhuja and
Zhang, Shuo",
editor = {Hamilton, Sil and
{\"O}hman, Emily and
Hicke, Rebecca M. M. and
Bizzoni, Yuri and
Bax, Axel and
Matthews, Jacob A. and
H{\"a}m{\"a}l{\"a}inen, Mika},
booktitle = "Proceedings of the 6th International Conference on Natural Language Processing for the Digital Humanities",
month = jul,
year = "2026",
address = "San Diego, USA",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl-workshops/2026.nlp4dh-1.32/",
pages = "355--367",
ISBN = "979-8-89176-427-9",
abstract = "While large language models excel at factual adaptation, their ability to internalize nuanced philosophical frameworks under severe data constraints remains underexplored. We investigate this by specializing small LLMs on micro-datasets of foundational Stoic texts using preference optimization (ORPO, AlphaPO). Evaluated via a multi-model critic bank, our results show that just 300 high-fidelity examples can induce strong alignment with inward-facing Stoic virtues, closely approaching few-shot prompting while freeing the context window. Critically, however, all models, including few-shot baselines, exhibit a persistent failure on Stoicism{'}s outward-facing cosmopolitan duties, pointing to a representational limitation of small models that micro-dataset adaptation alone cannot overcome."
}Markdown (Informal)
[StoicLLM: Preference Optimization for Philosophical Alignment in Small Language Models](https://preview.aclanthology.org/ingest-acl-workshops/2026.nlp4dh-1.32/) (Khan et al., NLP4DH 2026)
ACL