{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,9]],"date-time":"2025-12-09T19:20:34Z","timestamp":1765308034565,"version":"3.46.0"},"publisher-location":"New York, NY, USA","reference-count":66,"publisher":"ACM","funder":[{"name":"Funda\u00e7\u00e3o para a Ci\u00eancia e Tecnologia","award":["UIDP\/04516\/2020"],"award-info":[{"award-number":["UIDP\/04516\/2020"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,10,27]]},"DOI":"10.1145\/3746027.3758166","type":"proceedings-article","created":{"date-parts":[[2025,10,25]],"date-time":"2025-10-25T05:44:48Z","timestamp":1761371088000},"page":"12399-12408","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["MoralCLIP: Contrastive Alignment of Vision-and-Language Representations with Moral Foundations Theory"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9829-0936","authenticated-orcid":false,"given":"Ana Carolina","family":"Condez","sequence":"first","affiliation":[{"name":"NOVA LINCS, NOVA School of Science and Technology, Caparica, Portugal"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0147-369X","authenticated-orcid":false,"given":"Diogo","family":"Tavares","sequence":"additional","affiliation":[{"name":"NOVA LINCS, NOVA School of Science and Technology, Caparica, Portugal"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6290-5719","authenticated-orcid":false,"given":"Jo\u00e3o","family":"Magalh\u00e3es","sequence":"additional","affiliation":[{"name":"NOVA LINCS, NOVA School of Science and Technology, Caparica, Portugal"}]}],"member":"320","published-online":{"date-parts":[[2025,10,27]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1037\/pspp0000470"},{"key":"e_1_3_2_1_2_1","first-page":"490","volume-title":"Proceedings of the Computational 
Humanities Research Conference 2023, Paris, France, December 6-8, 2023 (CEUR Workshop Proceedings","volume":"16","author":"Barancov\u00e1 Alexandra","year":"2023","unstructured":"Alexandra Barancov\u00e1, Melvin Wevers, and Nanne van Noord. 2023. Blind Dates: Examining the Expression of Temporality in Historical Photographs. In Proceedings of the Computational Humanities Research Conference 2023, Paris, France, December 6-8, 2023 (CEUR Workshop Proceedings, Vol. 3558), Artjoms Sela, Fotis Jannidis, and Iza Romanowska (Eds.). CEUR-WS.org, EPITA, 14-16 Rue Voltaire, 94270 Le Kremlin-Bic\u00eatre, France, 490-499. https:\/\/ceur-ws.org\/Vol-3558\/paper5790.pdf"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1146\/annurev-psych-022123-110258"},{"key":"e_1_3_2_1_4_1","unstructured":"Lucas Beyer Andreas Steiner Andr\u00e9 Susano Pinto Alexander Kolesnikov Xiao Wang Daniel Salz Maxim Neumann Ibrahim Alabdulmohsin Michael Tschannen Emanuele Bugliarello Thomas Unterthiner Daniel Keysers Skanda Koppula Fangyu Liu Adam Grycner Alexey Gritsenko Neil Houlsby Manoj Kumar Keran Rong Julian Eisenschlos Rishabh Kabra Matthias Bauer Matko Bo\u0161njak Xi Chen Matthias Minderer Paul Voigtlaender Ioana Bica Ivana Balazevic Joan Puigcerver Pinelopi Papalampidi Olivier Henaff Xi Xiong Radu Soricut Jeremiah Harmsen and Xiaohua Zhai. 2024. PaliGemma: A Versatile 3B VLM for Transfer. 
arXiv:2407.07726 https:\/\/arxiv.org\/abs\/2407.07726 Preprint."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/CBMI62980.2024.10859215"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.3389\/frai.2023.1125533"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0190954"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2305.06500"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.18653\/V1\/N19-1423"},{"key":"e_1_3_2_1_10_1","volume-title":"Proceedings of the Thirteenth International Conference on Learning Representations (ICLR","author":"Eslami Sedigheh","year":"2025","unstructured":"Sedigheh Eslami and Gerard de Melo. 2025. Mitigate the Gap: Improving Cross-Modal Alignment in CLIP. In Proceedings of the Thirteenth International Conference on Learning Representations (ICLR 2025). ICLR, Singapore, 15 pages. https:\/\/openreview.net\/forum?id=aPTGvFqile"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.18653\/V1\/2023.FINDINGS-EACL.88"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.3758\/s13428-017-0875-9"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1016\/B978-0-12-407236-7.00002-4"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1037\/a0015141"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1037\/a0021847"},{"key":"e_1_3_2_1_16_1","unstructured":"Candida Maria Greco Lorenzo Zangari Davide Picca and Andrea Tagarelli. 2024. E2MoCase: A Dataset for Emotional Event and Moral Observations in News Articles on High-impact Legal Cases. 
arXiv:2409.09001 [cs.CL] https:\/\/arxiv.org\/abs\/2409.09001"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1609\/ICWSM.V17I1.22145"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.neuroimage.2009.10.062"},{"key":"e_1_3_2_1_19_1","volume-title":"Proceedings of the 9th International Conference on Learning Representations (ICLR). OpenReview.net, Virtual Event, 29 pages. https:\/\/openreview.net\/forum?id=dNy_RKzJacY","author":"Hendrycks Dan","year":"2021","unstructured":"Dan Hendrycks, Collin Burns, Steven Basart, Andrew Critch, Jerry Li, Dawn Song, and Jacob Steinhardt. 2021. Aligning AI With Shared Human Values. In Proceedings of the 9th International Conference on Learning Representations (ICLR). OpenReview.net, Virtual Event, 29 pages. https:\/\/openreview.net\/forum?id=dNy_RKzJacY"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1525\/collabra.129"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1177\/1948550619876629"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.3758\/s13428-020-01433-0"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.emnlp-main.137"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.eacl-main.126"},{"key":"e_1_3_2_1_25_1","volume-title":"Proceedings of the 33rd British Machine Vision Conference (BMVC). BMVA Press","author":"Jeong Yujin","year":"2022","unstructured":"Yujin Jeong, Seongbeom Park, Suhong Moon, and Jinkyu Kim. 2022. Zero-shot Visual Commonsense Immorality Prediction. In Proceedings of the 33rd British Machine Vision Conference (BMVC). BMVA Press, London, UK, 320. https:\/\/bmvc2022.mpi-inf.mpg.de\/320\/"},{"key":"e_1_3_2_1_26_1","volume-title":"Proceedings of the 38th International Conference on Machine Learning, ICML 2021","volume":"4916","author":"Jia Chao","year":"2021","unstructured":"Chao Jia, Yinfei Yang, Ye Xia, Yi-Ting Chen, Zarana Parekh, Hieu Pham, Quoc V. 
Le, Yun-Hsuan Sung, Zhen Li, and Tom Duerig. 2021. Scaling Up Visual and Vision-Language Representation Learning With Noisy Text Supervision. In Proceedings of the 38th International Conference on Machine Learning, ICML 2021, 18-24 July 2021, Virtual Event (Proceedings of Machine Learning Research, Vol. 139), Marina Meila and Tong Zhang (Eds.). PMLR, Virtual Event, 4904-4916. http:\/\/proceedings.mlr.press\/v139\/jia21b.html"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1080\/15213269.2017.1378108"},{"volume-title":"Multimodality: A Social Semiotic Approach to Contemporary Communication","author":"Kress Gunther","key":"e_1_3_2_1_28_1","unstructured":"Gunther Kress. 2010. Where Meaning is the Issue. In Multimodality: A Social Semiotic Approach to Contemporary Communication. Routledge, London, UK, 1-17."},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.acl-long.241"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.brainres.2019.146513"},{"key":"e_1_3_2_1_31_1","volume-title":"Pang Wei Koh, and Simon Shaolei Du","author":"Li Siting","year":"2025","unstructured":"Siting Li, Pang Wei Koh, and Simon Shaolei Du. 2025. Exploring How Generative MLLMs Perceive More Than CLIP with the Same Vision Encoder. arXiv:2411.05195 [cs.LG] https:\/\/arxiv.org\/abs\/2411.05195"},{"key":"e_1_3_2_1_32_1","volume-title":"Zou","author":"Liang Weixin","year":"2022","unstructured":"Weixin Liang, Yuhui Zhang, Yongchan Kwon, Serena Yeung, and James Y. Zou. 2022. Mind the Gap: Understanding the Modality Gap in Multi-modal Contrastive Representation Learning. In Advances in Neural Information Processing Systems 35 (NeurIPS 2022), Sanmi Koyejo, S. Mohamed, A. Agarwal, Danielle Belgrave, K. Cho, and A. Oh (Eds.). Curran Associates, Inc., New Orleans, LA, USA, 28865-28878. 
http:\/\/papers.nips.cc\/paper_files\/paper\/2022\/hash\/702f4db7543a7432431df588d57bc7c9-Abstract-Conference.html"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72992-8_22"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","unstructured":"Yinhan Liu Myle Ott Naman Goyal Jingfei Du Mandar Joshi Danqi Chen Omer Levy Mike Lewis Luke Zettlemoyer and Veselin Stoyanov. 2019. RoBERTa: A Robustly Optimized BERT Pretraining Approach. doi:10.48550\/arXiv.1907.11692 arXiv:1907.11692 [cs].","DOI":"10.48550\/arXiv.1907.11692"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511809071"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.3389\/fpsyg.2021.599024"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0213343"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0206604"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1609\/ICWSM.V18I1.31378"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.25969\/mediarep\/2231"},{"key":"e_1_3_2_1_41_1","first-page":"654","volume-title":"Findings of the Association for Computational Linguistics: EACL 2024","author":"Park Jeongwoo","year":"2024","unstructured":"Jeongwoo Park, Enrico Liscio, and Pradeep K. Murukannaiah. 2024. Morality is Non-Binary: Building a Pluralist Moral Sentence Embedding Space using Contrastive Learning. In Findings of the Association for Computational Linguistics: EACL 2024. Association for Computational Linguistics, Julian's, Malta, 654-673. https:\/\/aclanthology.org\/2024.findings-eacl.45 arXiv:2401.17228 [cs]."},{"key":"e_1_3_2_1_42_1","first-page":"340","volume-title":"Proceedings of the European Conference on Computer Vision (ECCV)","author":"Poppi Samuele","year":"2024","unstructured":"Samuele Poppi, Tobia Poppi, Federico Cocchi, Marcella Cornia, Lorenzo Baraldi, and Rita Cucchiara. 2024. 
Safe-CLIP: Removing NSFW Concepts from Vision-and-Language Models. In Proceedings of the European Conference on Computer Vision (ECCV) 2024. Springer, Milan, Italy, 340-356. Available online at: https:\/\/github.com\/aimagelab\/safe-clip."},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1145\/3677525.3678694"},{"key":"e_1_3_2_1_44_1","volume-title":"Proceedings of the 38th International Conference on Machine Learning (Proceedings of Machine Learning Research","volume":"8763","author":"Radford Alec","year":"2021","unstructured":"Alec Radford, Jong Wook Kim, Chris Hallacy, Aditya Ramesh, Gabriel Goh, Sandhini Agarwal, Girish Sastry, Amanda Askell, Pamela Mishkin, Jack Clark, Gretchen Krueger, and Ilya Sutskever. 2021. Learning Transferable Visual Models From Natural Language Supervision. In Proceedings of the 38th International Conference on Machine Learning (Proceedings of Machine Learning Research, Vol. 139). PMLR, Virtual, 8748-8763."},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.1016\/0377-0427(87)90125-7"},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.1177\/0894439313506837"},{"key":"e_1_3_2_1_48_1","volume-title":"LAION-400M: Open Dataset of CLIP-Filtered 400 Million Image-Text Pairs. CoRR","author":"Schuhmann Christoph","year":"2021","unstructured":"Christoph Schuhmann, Richard Vencu, Romain Beaumont, Robert Kaczmarczyk, Clayton Mullis, Aarush Katta, Theo Coombes, Jenia Jitsev, and Aran Komatsuzaki. 2021. LAION-400M: Open Dataset of CLIP-Filtered 400 Million Image-Text Pairs. CoRR, Vol. abs\/2111.02114 (2021), 5 pages. 
arXiv:2111.02114 https:\/\/arxiv.org\/abs\/2111.02114"},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00659"},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"publisher","DOI":"10.1108\/JCOM-01-2023-0006"},{"key":"e_1_3_2_1_51_1","doi-asserted-by":"publisher","DOI":"10.1080\/15205436.2017.1342130"},{"key":"e_1_3_2_1_52_1","doi-asserted-by":"publisher","unstructured":"Jackson Trager Alireza S. Ziabari Aida Mostafazadeh Davani Preni Golazizian Farzan Karimi-Malekabadi Ali Omrani Zhihe Li Brendan Kennedy Nils Karl Reimer Melissa Reyes Kelsey Cheng Mellow Wei Christina Merrifield Arta Khosravi Evans Alvarez and Morteza Dehghani. 2022. The Moral Foundations Reddit Corpus. doi:10.48550\/arXiv.2208.05545 arXiv:2208.05545 [cs].","DOI":"10.48550\/arXiv.2208.05545"},{"key":"e_1_3_2_1_53_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.2502.14786"},{"key":"e_1_3_2_1_54_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11097-023-09918-x"},{"key":"e_1_3_2_1_55_1","doi-asserted-by":"publisher","unstructured":"Vik Korrapati. 2024. moondream2 (Revision 92d3d73). doi:10.57967\/hf\/3219","DOI":"10.57967\/hf\/3219"},{"key":"e_1_3_2_1_56_1","doi-asserted-by":"publisher","DOI":"10.1080\/19312458.2018.1447656"},{"key":"e_1_3_2_1_57_1","doi-asserted-by":"publisher","DOI":"10.1348\/026151005X74153"},{"key":"e_1_3_2_1_58_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-15428-8"},{"key":"e_1_3_2_1_59_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.309"},{"key":"e_1_3_2_1_60_1","doi-asserted-by":"publisher","unstructured":"Bei Yan Jie Zhang Zhiyuan Chen Shiguang Shan and Xilin Chen. 2024. M\u00b3oralBench: A MultiModal Moral Benchmark for LVLMs. 
doi:10.48550\/arXiv.2412.20718 arXiv:2412.20718 [cs].","DOI":"10.48550\/arXiv.2412.20718"},{"key":"e_1_3_2_1_61_1","volume-title":"Proceedings of the 31st International Conference on Computational Linguistics, Owen Rambow, Leo Wanner, Marianna Apidianaki, Hend Al-Khalifa","author":"Zangari Lorenzo","year":"2025","unstructured":"Lorenzo Zangari, Candida M. Greco, Davide Picca, and Andrea Tagarelli. 2025. ME2-BERT: Are Events and Emotions what you need for Moral Foundation Prediction?. In Proceedings of the 31st International Conference on Computational Linguistics, Owen Rambow, Leo Wanner, Marianna Apidianaki, Hend Al-Khalifa, Barbara Di Eugenio, and Steven Schockaert (Eds.). Association for Computational Linguistics, Abu Dhabi, UAE, 9516-9532. https:\/\/aclanthology.org\/2025.coling-main.638\/"},{"key":"e_1_3_2_1_62_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01100"},{"key":"e_1_3_2_1_63_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72983-6_18"},{"key":"e_1_3_2_1_64_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.naacl-long.252"},{"key":"e_1_3_2_1_65_1","first-page":"1","volume-title":"Proceedings of the 12th International Conference on Learning Representations (ICLR). OpenReview.net","author":"Zhou Qihang","year":"2024","unstructured":"Qihang Zhou, Guansong Pang, Yu Tian, Shibo He, and Jiming Chen. 2024. AnomalyCLIP: Object-agnostic Prompt Learning for Zero-shot Anomaly Detection. In Proceedings of the 12th International Conference on Learning Representations (ICLR). OpenReview.net, Vienna, Austria, 1-33. 
https:\/\/openreview.net\/forum?id=buC4E91xZE"},{"key":"e_1_3_2_1_66_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-35995-8_30"}],"event":{"name":"MM '25: The 33rd ACM International Conference on Multimedia","sponsor":["SIGMM ACM Special Interest Group on Multimedia"],"location":"Dublin Ireland","acronym":"MM '25"},"container-title":["Proceedings of the 33rd ACM International Conference on Multimedia"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3746027.3758166","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,9]],"date-time":"2025-12-09T19:16:42Z","timestamp":1765307802000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3746027.3758166"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,27]]},"references-count":66,"alternative-id":["10.1145\/3746027.3758166","10.1145\/3746027"],"URL":"https:\/\/doi.org\/10.1145\/3746027.3758166","relation":{},"subject":[],"published":{"date-parts":[[2025,10,27]]},"assertion":[{"value":"2025-10-27","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}