@comment{
  Entry for the ConlangCrafter paper in the ACL 2026 (64th Annual Meeting)
  long-papers proceedings.

  Case protection in title and booktitle is applied to whole words so that
  sentence-casing styles keep the capitals without mid-word brace groups.

  NOTE(review): the url field points at a preview.aclanthology.org ingest
  build; presumably it should be switched to the canonical aclanthology.org
  address once the volume is published -- TODO confirm before relying on it.

  NOTE(review): the last author is stored as plain ASCII; the name may be
  missing diacritics -- verify against the paper before changing it.
}
@inproceedings{alper-etal-2026-conlangcrafter,
  title     = {{ConlangCrafter}: Constructing Languages with a Multi-Hop {LLM} Pipeline},
  author    = {Alper, Morris and
               Yanuka, Moran and
               Giryes, Raja and
               Begus, Gasper},
  editor    = {Liakata, Maria and
               Moreira, Viviane P. and
               Zhang, Jiajun and
               Jurgens, David},
  booktitle = {Proceedings of the 64th Annual Meeting of the {Association} for {Computational} {Linguistics} (Volume 1: Long Papers)},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.acl-long.422/},
  pages     = {9318--9349},
  isbn      = {979-8-89176-390-6},
  abstract  = {Constructed languages (conlangs) such as Esperanto and Quenya have played diverse roles in art, philosophy, and international communication. Meanwhile, foundation models have revolutionized creative generation in text, images, and beyond. In this work, we leverage modern LLMs as computational creativity aids for end-to-end conlang creation. We introduce ConlangCrafter, a multi-hop pipeline that decomposes language design into modular stages {--} phonology, morphology, syntax, lexicon generation, and translation. At each stage, our method leverages LLMs' metalinguistic reasoning capabilities, injecting randomness to encourage diversity and leveraging self-refinement feedback to encourage consistency in the emerging language description. We construct a novel, scalable evaluation framework for this task, evaluating metrics measuring consistency and typological diversity. Automatic and manual evaluations demonstrate ConlangCrafter{'}s ability to produce coherent and varied conlangs without human linguistic expertise. We will release our code and data.},
}
Markdown (Informal)
[ConlangCrafter: Constructing Languages with a Multi-Hop LLM Pipeline](https://preview.aclanthology.org/ingest-acl/2026.acl-long.422/) (Alper et al., ACL 2026)
ACL
- Morris Alper, Moran Yanuka, Raja Giryes, and Gasper Begus. 2026. ConlangCrafter: Constructing Languages with a Multi-Hop LLM Pipeline. In Proceedings of the 64th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pages 9318–9349, San Diego, California, United States. Association for Computational Linguistics.