@inproceedings{f418212db9a54dd19c099b5ef52ec603,
title = "A Report on the FigLang 2024 Shared Task on Multimodal Figurative Language",
abstract = "We present the outcomes of the Multimodal Figurative Language Shared Task held at the 4th Workshop on Figurative Language Processing (FigLang 2024) co-located at NAACL 2024. The task utilized the V-FLUTE dataset (Saakyan et al., 2024) which is comprised of pairs that use figurative language and includes detailed textual explanations for the entailment or contradiction relationship of each pair. The challenge for participants was to develop models capable of accurately identifying the visual entailment relationship in these multimodal instances and generating persuasive free-text explanations. The results showed that the participants{\textquoteright} models significantly outperformed the initial baselines in both automated and human evaluations. We also provide an overview of the systems submitted and analyze the results of the evaluations. All participating systems outperformed the LLaVA-ZS baseline, provided by us in F1-score.",
author = "Shreyas Kulkarni and Arkadiy Saakyan and Tuhin Chakrabarty and Smaranda Muresan",
note = "Publisher Copyright: {\textcopyright} 2024 Association for Computational Linguistics.; 4th Workshop on Figurative Language Processing, FigLang 2024 ; Conference date: 21-06-2024",
year = "2024",
doi = "10.18653/v1/2024.figlang-1.16",
language = "English",
series = "FigLang 2024 - 4th Workshop on Figurative Language Processing, Proceedings of the Workshop",
publisher = "Association for Computational Linguistics (ACL)",
pages = "115--119",
editor = "Debanjan Ghosh and Smaranda Muresan and Anna Feldman and Tuhin Chakrabarty and Emmy Liu",
booktitle = "FigLang 2024 - 4th Workshop on Figurative Language Processing, Proceedings of the Workshop",
}