@inproceedings{ebrahimi-etal-2025-adversary,
title = "An Adversary-Resistant Multi-Agent {LLM} System via Credibility Scoring",
author = "Ebrahimi, Sana and
Dehghankar, Mohsen and
Asudeh, Abolfazl",
editor = "Inui, Kentaro and
Sakti, Sakriani and
Wang, Haofen and
Wong, Derek F. and
Bhattacharyya, Pushpak and
Banerjee, Biplab and
Ekbal, Asif and
Chakraborty, Tanmoy and
Singh, Dhirendra Pratap",
booktitle = "Proceedings of the 14th International Joint Conference on Natural Language Processing and the 4th Conference of the Asia-Pacific Chapter of the Association for Computational Linguistics",
month = dec,
year = "2025",
address = "Mumbai, India",
publisher = "The Asian Federation of Natural Language Processing and The Association for Computational Linguistics",
url = "https://preview.aclanthology.org/ingest-ijcnlp-aacl/2025.ijcnlp-long.90/",
pages = "1676--1693",
ISBN = "979-8-89176-298-5",
abstract = "While multi-agent LLM systems show strong capabilities in various domains, they are highly vulnerable to adversarial and low-performing agents. To resolve this issue, in this paper, we introduce a general and adversary-resistant multi-agent LLM framework based on credibility scoring. We model the collaborative query-answering process as an iterative game, where the agents communicate and contribute to a final system output. Our system associates a credibility score that is used when aggregating the team outputs. The credibility scores are learned gradually based on the past contributions of each agent in query answering. Our experiments across multiple tasks and settings demonstrate our system{'}s effectiveness in mitigating adversarial influence and enhancing the resilience of multi-agent cooperation, even in the adversary-majority settings."
}Markdown (Informal)
[An Adversary-Resistant Multi-Agent LLM System via Credibility Scoring](https://preview.aclanthology.org/ingest-ijcnlp-aacl/2025.ijcnlp-long.90/) (Ebrahimi et al., IJCNLP-AACL 2025)
ACL
- Sana Ebrahimi, Mohsen Dehghankar, and Abolfazl Asudeh. 2025. An Adversary-Resistant Multi-Agent LLM System via Credibility Scoring. In Proceedings of the 14th International Joint Conference on Natural Language Processing and the 4th Conference of the Asia-Pacific Chapter of the Association for Computational Linguistics, pages 1676–1693, Mumbai, India. The Asian Federation of Natural Language Processing and The Association for Computational Linguistics.