% Conference paper: the venue is a conference and the record carries
% editor, publisher and address data, so it is stored as an inproceedings
% entry with the venue in booktitle (standard styles do not print editor,
% publisher or address for article entries).
% The original non-numeric volume label "main" is kept in an ignored
% annotation field so it is not rendered as a volume number.
% NOTE(review): the url points at an Anthology preview/ingest host; confirm
% the final canonical URL (and add a DOI if one is assigned) before release.
@inproceedings{cao-etal-2026-graph,
  title         = {{Graph-TempCZ}: A Graph Representation of Software Mentions for Predicting Software Usage in Scientific Publications},
  author        = {Cao, Congfeng and
                   Zhang, Pengyu and
                   Bloem, Jelke},
  editor        = {Piperidis, Stelios and
                   Bel, N{\'u}ria and
                   van den Heuvel, Henk and
                   Ide, Nancy and
                   Krek, Simon and
                   Toral, Antonio},
  booktitle     = {International Conference on Language Resources and Evaluation},
  month         = may,
  year          = {2026},
  address       = {Palma de Mallorca, Spain},
  publisher     = {ELRA Language Resource Association},
  pages         = {7791--7803},
  url           = {https://preview.aclanthology.org/ingest-lrec/2026.lrec-main.619/},
  internal-note = {Anthology volume label: main},
  abstract      = {Predicting how software is used, shared, and evolves across publications is essential to studying scientific progress. Existing methods for representing software usage in publications rely mainly on tabular or textual formats, which limit their structural expressiveness and consequently their ability to predict software usage. We address these gaps by representing software mentions and citations as a graph and formulating software usage prediction as a link prediction task. To support this study, we construct the first large-scale graph dataset of publication and software mentions, Graph-TempCZ, covering 1959-2022 with over six million mention relationships. Experiments using both traditional machine learning and Graph Neural Network (GNN) show that graph-based models substantially outperform feature-based baselines, achieving a 5.98\% improvement in test accuracy. Temporal experiments further reveal that models trained on one year generalize effectively to nearby years but show gradual performance decay as the temporal gap increases. This work provides the first comprehensive foundation for analyzing software usage through a temporal graph representation.},
}
Markdown (Informal)
[Graph-TempCZ: A Graph Representation of Software Mentions for Predicting Software Usage in Scientific Publications](https://preview.aclanthology.org/ingest-lrec/2026.lrec-main.619/) (Cao et al., LREC 2026)
ACL