@inproceedings{sternlicht-hope-2026-chimera,
title = "{CHIMERA}: A Knowledge Base of Scientific Idea Recombinations for Research Analysis and Ideation",
author = "Sternlicht, Noy and
Hope, Tom",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Proceedings of the 64th Annual Meeting of the {A}ssociation for {C}omputational {L}inguistics (Volume 1: Long Papers)",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-acl/2026.acl-long.85/",
pages = "1871--1905",
ISBN = "979-8-89176-390-6",
abstract = "A hallmark of human innovation is recombination{---}the creation of novel ideas by integrating elements from existing concepts and mechanisms. In this work, we introduce CHIMERA, the first large-scale Knowledge Base (KB) of recombination examples automatically mined from the scientific literature. CHIMERA enables empirical analysis of how scientists recombine concepts and draw inspiration from different areas, and enables training models that propose cross-disciplinary research directions. To construct this KB, we define a new information extraction task: identifying recombination instances in papers. We curate an expert-annotated dataset and use it to fine-tune an LLM-based extraction model, which we apply to a broad corpus of AI papers. We also demonstrate generalization to a biological domain. We showcase the utility of CHIMERA through two applications. First, we analyze patterns of recombination across AI subfields. Second, we train a scientific hypothesis generation model using the KB, showing that it can propose directions that researchers rate as inspiring."
}Markdown (Informal)
[CHIMERA: A Knowledge Base of Scientific Idea Recombinations for Research Analysis and Ideation](https://preview.aclanthology.org/ingest-acl/2026.acl-long.85/) (Sternlicht & Hope, ACL 2026)
ACL