% ACL Anthology record for the NLP4DH 2026 paper by Miyagawa et al.
% Every non-ASCII letter is written as a LaTeX accent command so the entry
% stays usable with classic 8-bit BibTeX as well as with Biber.
% NOTE(review): `url` points at a preview.aclanthology.org ingest build --
% confirm the canonical link before this entry is published.
@inproceedings{miyagawa-etal-2026-quantifying,
  title     = {Quantifying Text Reuse Across Three {K{\d{r}}{\d{s}}{\d{n}}a} {Yajurveda} Recensions: Using Multi-Algorithm Computational Collation},
  author    = {Miyagawa, So and
               Amano, Kyoko and
               Tsukagoshi, Yuzuki and
               Kyogoku, Yuki},
  editor    = {Hamilton, Sil and
               {\"O}hman, Emily and
               Hicke, Rebecca M. M. and
               Bizzoni, Yuri and
               Bax, Axel and
               Matthews, Jacob A. and
               H{\"a}m{\"a}l{\"a}inen, Mika},
  booktitle = {Proceedings of the 6th International Conference on Natural Language Processing for the Digital Humanities},
  month     = jul,
  year      = {2026},
  address   = {San Diego, USA},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl-workshops/2026.nlp4dh-1.5/},
  pages     = {41--49},
  isbn      = {979-8-89176-427-9},
  abstract  = {The K{\d{r}}{\d{s}}{\d{n}}a Yajurveda survives in multiple recensions that share substantial ritual content, yet the degree and distribution of textual overlap across recensions have never been quantified systematically. This paper presents a computational analysis of text reuse across three recensions{---}the Maitr{\={a}}ya{\d{n}}{\={i}} Sa{\d{m}}hit{\={a}} (MS), the K{\={a}}{\d{t}}haka Sa{\d{m}}hit{\={a}} (KS), and the Taittir{\={i}}ya Sa{\d{m}}hit{\={a}} (TS){---}for two ritual sections (Agnyupasth{\={a}}na and Punar{\={a}}dh{\={a}}na), using ICoMa (Intertextuality Collation Machine), a new web-based multi-algorithm collation tool. Five independent similarity algorithms consistently rank MS{--}KS as the most closely related pair, corroborating the philological consensus. Crucially, the two ritual sections exhibit strikingly different reuse profiles: Punar{\={a}}dh{\={a}}na shows near-identical MS{--}KS overlap (up to 93.5{\%}) with sharp divergence from TS, while Agnyupasth{\={a}}na displays moderate, broadly distributed similarity across all three pairs. These contrasting patterns provide quantitative evidence that different ritual categories followed distinct paths of textual transmission within the Yajurvedic tradition. ICoMa and the experimental data are freely available.},
}
Markdown (Informal)
[Quantifying Text Reuse Across Three Kṛṣṇa Yajurveda Recensions: Using Multi-Algorithm Computational Collation](https://preview.aclanthology.org/ingest-acl-workshops/2026.nlp4dh-1.5/) (Miyagawa et al., NLP4DH 2026)
ACL