% Conference paper record; the url field identifies it as 2026.findings-acl.1924.
% NOTE(review): `url` points at a "preview"/"ingest-acl" host path -- confirm
% whether a canonical (non-preview) URL should be used before citing.
@inproceedings{baud-etal-2026-agent,
  title     = {Agent for Numerical Data Retrieval and Understanding by Code Generation and Multimodal Reasoning},
  author    = {Baud, Florian and
               Almuhisen, Feda and
               Midou, Dorian},
  editor    = {Liakata, Maria and
               Moreira, Viviane P. and
               Zhang, Jiajun and
               Jurgens, David},
  booktitle = {Findings of the {Association} for {Computational} {Linguistics}: {ACL} 2026},
  month     = jul,
  year      = {2026},
  address   = {San Diego, California, United States},
  publisher = {Association for Computational Linguistics},
  url       = {https://preview.aclanthology.org/ingest-acl/2026.findings-acl.1924/},
  pages     = {38630--38653},
  isbn      = {979-8-89176-395-1},
  abstract  = {Numerical data from sensors and time series are widely used in scientific research fields such as nuclear fusion experiments, which generate vast amounts of complex, high-dimensional data. Therefore, efficient numerical data analysis tools are crucial to accelerate experimental research. Large language models (LLMs) have emerged as promising solutions to analyze numerical data with natural language queries. However, LLMs have difficulties treating this type of data as they have been designed for text in the first place. To overcome these limitations, we propose a model-agnostic and data-agnostic agent that processes numerical data by code generation and multimodal reasoning. Our agent demonstrates competitive performance against baselines on benchmark data on numerical data tasks such as sensor data classification and time series understanding. While outperforming them on information retrieval benchmarks, also we have successfully applied our agent in the context of nuclear fusion research, where physicists and Tokamak operators interact with it to plan and analyze fusion experiments.},
}

Markdown (Informal)
[Agent for Numerical Data Retrieval and Understanding by Code Generation and Multimodal Reasoning](https://preview.aclanthology.org/ingest-acl/2026.findings-acl.1924/) (Baud et al., Findings 2026)
ACL