% SmartTrim conference paper, LREC-COLING 2024 main proceedings (pp. 14937--14953).
% The url field uses the canonical ACL Anthology address for paper ID
% 2024.lrec-main.1300 instead of a temporary preview/ingest build.
@inproceedings{wang-etal-2024-smarttrim,
  author    = {Wang, Zekun and Chen, Jingchang and Zhou, Wangchunshu and Zhu, Haichao and Liang, Jiafeng and Shan, Liping and Liu, Ming and Xu, Dongliang and Yang, Qing and Qin, Bing},
  title     = {{SmartTrim}: Adaptive Tokens and Attention Pruning for Efficient Vision-Language Models},
  editor    = {Calzolari, Nicoletta and Kan, Min-Yen and Hoste, Veronique and Lenci, Alessandro and Sakti, Sakriani and Xue, Nianwen},
  booktitle = {Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation ({LREC-COLING} 2024)},
  month     = may,
  year      = {2024},
  address   = {Torino, Italia},
  publisher = {ELRA and ICCL},
  pages     = {14937--14953},
  url       = {https://aclanthology.org/2024.lrec-main.1300/},
}