@inproceedings{harde-etal-2025-lecnet,
title = "{L}e{CN}et: A Legal Citation Network Benchmark Dataset",
author = "Harde, Pooja and
Jain, Bhavya and
Jain, Sarika",
editor = "Modi, Ashutosh and
Ghosh, Saptarshi and
Ekbal, Asif and
Goyal, Pawan and
Jain, Sarika and
Joshi, Abhinav and
Mishra, Shivani and
Datta, Debtanu and
Paul, Shounak and
Singh, Kshetrimayum Boynao and
Kumar, Sandeep",
booktitle = "Proceedings of the 1st Workshop on NLP for Empowering Justice (JUST-NLP 2025)",
month = dec,
year = "2025",
address = "Mumbai, India",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-ijcnlp-aacl/2025.justnlp-main.4/",
pages = "18--28",
ISBN = "979-8-89176-312-8",
abstract = "Legal document analysis is pivotal in modern judicial systems, particularly for case retrieval, classification, and recommendation tasks. Graph neural networks (GNNs) have revolutionized legal use cases by enabling the efficient analysis of complex relationships. Although existing legal citation network datasets have significantly advanced research in this domain, the lack of large-scale open-source datasets tailored to the Indian judicial system has limited progress. To address this gap, we present the Indian Legal Citation Network (LeCNet) - the first open-source benchmark dataset for the link prediction task (missing citation recommendation) in the Indian judicial context. The dataset has been created by extracting information from the original judgments. LeCNet comprises 26,308 nodes representing case judgments and 67,108 edges representing citation relationships between the case nodes. Each node is described with rich features of document embeddings that incorporate contextual information from the case documents. Baseline experiments using various machine learning models were conducted for dataset validation. The Mean Reciprocal Rank (MRR) metric is used for model evaluation. The results obtained demonstrate the utility of the LeCNet dataset, highlighting the advantages of graph-based representations over purely textual models."
}Markdown (Informal)
[LeCNet: A Legal Citation Network Benchmark Dataset](https://preview.aclanthology.org/ingest-ijcnlp-aacl/2025.justnlp-main.4/) (Harde et al., JUSTNLP 2025)
ACL
- Pooja Harde, Bhavya Jain, and Sarika Jain. 2025. LeCNet: A Legal Citation Network Benchmark Dataset. In Proceedings of the 1st Workshop on NLP for Empowering Justice (JUST-NLP 2025), pages 18–28, Mumbai, India. Association for Computational Linguistics.