% Conference paper (Findings of EACL 2026) describing ILSIC, a corpus of
% layperson queries for Legal Statute Identification over Indian law.
% The url field uses the canonical aclanthology.org address built from the
% anthology id 2026.findings-eacl.354; the earlier value pointed at the
% temporary preview.aclanthology.org/ingest-eacl staging site.
% NOTE(review): confirm the canonical page is live before publishing.
% NOTE(review): address holds the conference venue (ACL convention), not
% the publisher's city.
@inproceedings{paul-etal-2026-ilsic,
  title     = {{ILSIC}: Corpora for Identifying {Indian} Legal Statutes from Queries by Laymen},
  author    = {Paul, Shounak and
               Dogra, Raghav and
               Goyal, Pawan and
               Ghosh, Saptarshi},
  editor    = {Demberg, Vera and
               Inui, Kentaro and
               Marquez, Llu{\'i}s},
  booktitle = {Findings of the {Association} for {Computational} {Linguistics}: {EACL} 2026},
  month     = mar,
  year      = {2026},
  address   = {Rabat, Morocco},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2026.findings-eacl.354/},
  pages     = {6725--6746},
  isbn      = {979-8-89176-386-9},
  abstract  = {Legal Statute Identification (LSI) for a given situation is one of the most fundamental tasks in Legal NLP. This task has traditionally been modeled using facts from court judgments as input queries, due to their abundance. However, in practical settings, the input queries are likely to be informal and asked by laypersons, or non-professionals. While a few laypeople LSI datasets exist, there has been little research to explore the differences between court and laypeople data for LSI. In this work, we create ILSIC, a corpus of laypeople queries covering 500+ statutes from Indian law. Additionally, the corpus also contains court case judgements to enable researchers to effectively compare between court and laypeople data for LSI. We conducted extensive experiments on our corpus, including benchmarking over the laypeople dataset using zero and few-shot inference, retrieval-augmented generation and supervised fine-tuning. We observe that models trained purely on court judgements are ineffective during test on laypeople queries, while transfer learning from court to laypeople data can be beneficial in certain scenarios. We also conducted fine-grained analyses of our results in terms of categories of queries and frequency of statutes.},
}
Markdown (Informal)
[ILSIC: Corpora for Identifying Indian Legal Statutes from Queries by Laymen](https://aclanthology.org/2026.findings-eacl.354/) (Paul et al., Findings 2026)
ACL