@inproceedings{hatami-etal-2025-leveraging,
title = "Leveraging Visual Scene Graph to Enhance Translation Quality in Multimodal Machine Translation",
author = "Hatami, Ali and
Arcan, Mihael and
Buitelaar, Paul",
editor = "Bouillon, Pierrette and
Gerlach, Johanna and
Girletti, Sabrina and
Volkart, Lise and
Rubino, Raphael and
Sennrich, Rico and
Farinha, Ana C. and
Gaido, Marco and
Daems, Joke and
Kenny, Dorothy and
Moniz, Helena and
Szoc, Sara",
booktitle = "Proceedings of Machine Translation Summit XX: Volume 1",
month = jun,
year = "2025",
address = "Geneva, Switzerland",
publisher = "European Association for Machine Translation",
url = "https://preview.aclanthology.org/mtsummit-25-ingestion/2025.mtsummit-1.27/",
pages = "353--364",
ISBN = "978-2-9701897-0-1",
abstract = "Despite significant advancements in Multimodal Machine Translation, understanding and effectively utilising visual scenes within multimodal models remains a complex challenge. Extracting comprehensive and relevant visual features requires extensive and detailed input data to ensure the model accurately captures objects, their attributes, and relationships within a scene. In this paper, we explore using visual scene graphs extracted from images to enhance the performance of translation models. We investigate this approach for integrating Visual Scene Graph information into translation models, focusing on representing this information in a semantic structure rather than relying on raw image data. The performance of our approach was evaluated on the Multi30K dataset for English into German, French, and Czech translations using BLEU, chrF2, TER and COMET metrics. Our results demonstrate that utilising visual scene graph information improves translation performance. Using information on semantic structure can improve the multimodal baseline model, leading to better contextual understanding and translation accuracy."
}
Markdown (Informal)
[Leveraging Visual Scene Graph to Enhance Translation Quality in Multimodal Machine Translation](https://preview.aclanthology.org/mtsummit-25-ingestion/2025.mtsummit-1.27/) (Hatami et al., MTSummit 2025)
ACL