{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,16]],"date-time":"2026-06-16T04:36:00Z","timestamp":1781584560165,"version":"3.54.5"},"publisher-location":"New York, NY, USA","reference-count":37,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,5,30]],"date-time":"2024-05-30T00:00:00Z","timestamp":1717027200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"name":"NORDIS","award":["101158604"],"award-info":[{"award-number":["101158604"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,5,30]]},"DOI":"10.1145\/3652583.3657587","type":"proceedings-article","created":{"date-parts":[[2024,6,7]],"date-time":"2024-06-07T06:30:40Z","timestamp":1717741840000},"page":"1275-1281","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":16,"title":["Overview of the Grand Challenge on Detecting Cheapfakes at ACM ICMR 2024"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-2761-2213","authenticated-orcid":false,"given":"Duc-Tien","family":"Dang-Nguyen","sequence":"first","affiliation":[{"name":"University of Bergen, Bergen, Norway"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5351-2278","authenticated-orcid":false,"given":"Sohail Ahmed","family":"Khan","sequence":"additional","affiliation":[{"name":"University of Bergen, Bergen, Norway"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3153-2064","authenticated-orcid":false,"given":"Michael","family":"Riegler","sequence":"additional","affiliation":[{"name":"SimulaMet, Oslo, Norway"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2073-7029","authenticated-orcid":false,"given":"P\u00e5l","family":"Halvorsen","sequence":"additional","affiliation":[{"name":"SimulaMet, Oslo, Norway"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8036-954X","authenticated-orcid":false,"given":"Anh-Duy","family":"Tran","sequence":"additional","affiliation":[{"name":"imec-DistriNet, KU Leuven, Leuven, Belgium"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3044-8175","authenticated-orcid":false,"given":"Minh-Son","family":"Dao","sequence":"additional","affiliation":[{"name":"National Institute of Information and Communications Technology, Tokyo, Japan"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3046-3041","authenticated-orcid":false,"given":"Minh-Triet","family":"Tran","sequence":"additional","affiliation":[{"name":"University of Science, Ho Chi Minh, Vietnam"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2024,6,7]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"COSMOS: Catching Out-of-Context Image Misuse Using Self-Supervised Learning. In AAAI Conference on Artificial Intelligence. https:\/\/api.semanticscholar.org\/CorpusID:259693535","author":"Aneja Shivangi","year":"2023","unstructured":"Shivangi Aneja, Chris Bregler, and Matthias Nie\u00dfner. 2023. COSMOS: Catching Out-of-Context Image Misuse Using Self-Supervised Learning. In AAAI Conference on Artificial Intelligence. https:\/\/api.semanticscholar.org\/CorpusID:259693535"},{"key":"e_1_3_2_1_2_1","unstructured":"S. Aneja C. Midoglu D. Dang-Nguyen M. A. Riegler P. Halvorsen Ma. Niessner B. Adsumilli and C. Bregler. 2021. MMSys'21 Grand Challenge on Detecting Cheapfakes. arxiv: 2107.05297 [cs.MM]"},{"key":"e_1_3_2_1_3_1","volume-title":"Somalia Military Forces. https:\/\/tinyurl.com\/2tbxjek2 Retrieved","author":"AP.","year":"2024","unstructured":"AP. 2016. Somalia Military Forces. https:\/\/tinyurl.com\/2tbxjek2 Retrieved April 20, 2024 from"},{"key":"e_1_3_2_1_4_1","volume-title":"Australia -- it's not a real photo. https:\/\/factcheck.afp.com\/virtual-image-was-created-artist-new-south-wales-australia-its-not-real-photo Retrieved","author":"Australia AFP","year":"2024","unstructured":"AFP Australia. 2020. This virtual image was created by an artist in New South Wales, Australia -- it's not a real photo. https:\/\/factcheck.afp.com\/virtual-image-was-created-artist-new-south-wales-australia-its-not-real-photo Retrieved April 20, 2024 from"},{"key":"e_1_3_2_1_5_1","volume-title":"Cise Midoglu, Michael Riegler, P\u00e5l Halvorsen, and Minh-Son Dao.","author":"Dang-Nguyen Duc-Tien","year":"2023","unstructured":"Duc-Tien Dang-Nguyen, Sohail Ahmed Khan, Cise Midoglu, Michael Riegler, P\u00e5l Halvorsen, and Minh-Son Dao. 2023. Grand challenge on detecting cheapfakes. arXiv preprint arXiv:2304.01328 (2023)."},{"key":"e_1_3_2_1_6_1","unstructured":"Peng Gao Jiaming Han Renrui Zhang Ziyi Lin Shijie Geng Aojun Zhou Wei Zhang Pan Lu Conghui He Xiangyu Yue et al. 2023. Llama-adapter v2: Parameter-efficient visual instruction model. arXiv preprint arXiv:2304.15010 (2023)."},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"e_1_3_2_1_8_1","volume-title":"Debertav3: Improving deberta using electra-style pre-training with gradient-disentangled embedding sharing. arXiv preprint arXiv:2111.09543","author":"He Pengcheng","year":"2021","unstructured":"Pengcheng He, Jianfeng Gao, and Weizhu Chen. 2021. Debertav3: Improving deberta using electra-style pre-training with gradient-disentangled embedding sharing. arXiv preprint arXiv:2111.09543 (2021)."},{"key":"e_1_3_2_1_9_1","volume-title":"Diego de las Casas, Florian Bressand, Gianna Lengyel, Guillaume Lample, Lucile Saulnier, et al.","author":"Jiang Albert Q","year":"2023","unstructured":"Albert Q Jiang, Alexandre Sablayrolles, Arthur Mensch, Chris Bamford, Devendra Singh Chaplot, Diego de las Casas, Florian Bressand, Gianna Lengyel, Guillaume Lample, Lucile Saulnier, et al. 2023. Mistral 7B. arXiv preprint arXiv:2310.06825 (2023)."},{"key":"e_1_3_2_1_10_1","volume-title":"Diego de las Casas, Emma Bou Hanna, Florian Bressand, et al.","author":"Jiang Albert Q","year":"2024","unstructured":"Albert Q Jiang, Alexandre Sablayrolles, Antoine Roux, Arthur Mensch, Blanche Savary, Chris Bamford, Devendra Singh Chaplot, Diego de las Casas, Emma Bou Hanna, Florian Bressand, et al. 2024. Mixtral of experts. arXiv preprint arXiv:2401.04088 (2024)."},{"key":"e_1_3_2_1_11_1","volume-title":"Advances in Neural Information Processing Systems","volume":"36","author":"Koh Jing Yu","year":"2024","unstructured":"Jing Yu Koh, Daniel Fried, and Russ R Salakhutdinov. 2024. Generating images with multimodal language models. Advances in Neural Information Processing Systems , Vol. 36 (2024)."},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1145\/3652583.3657602"},{"key":"e_1_3_2_1_13_1","volume-title":"Chanvichet Vong, and \"Teknium\".","author":"Lian Wing","year":"2023","unstructured":"Wing Lian, Bleys Goodson, Guan Wang, Eugene Pentland, Austin Cook, Chanvichet Vong, and \"Teknium\". 2023. MistralOrca: Mistral-7B Model Instruct-tuned on Filtered OpenOrcaV1 GPT-4 Dataset."},{"key":"e_1_3_2_1_14_1","volume-title":"Roberta: A robustly optimized bert pretraining approach. arXiv preprint arXiv:1907.11692","author":"Liu Yinhan","year":"2019","unstructured":"Yinhan Liu, Myle Ott, Naman Goyal, Jingfei Du, Mandar Joshi, Danqi Chen, Omer Levy, Mike Lewis, Luke Zettlemoyer, and Veselin Stoyanov. 2019. Roberta: A robustly optimized bert pretraining approach. arXiv preprint arXiv:1907.11692 (2019)."},{"key":"e_1_3_2_1_15_1","volume-title":"Yi Tay, Denny Zhou, Quoc V. Le, Barret Zoph, Jason Wei, and Adam Roberts.","author":"Longpre Shayne","year":"2023","unstructured":"Shayne Longpre, Le Hou, Tu Vu, Albert Webson, Hyung Won Chung, Yi Tay, Denny Zhou, Quoc V. Le, Barret Zoph, Jason Wei, and Adam Roberts. 2023. The Flan Collection: Designing Data and Methods for Effective Instruction Tuning. arxiv: 2301.13688 [cs.AI]"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"crossref","unstructured":"G. Luo T. Darrell and A. Rohrbach. 2021. NewsCLIPpings: Automatic Generation of Out-of-Context Multimodal Media. arxiv: 2104.05893 [cs.CV]","DOI":"10.18653\/v1\/2021.emnlp-main.545"},{"key":"e_1_3_2_1_17_1","volume-title":"Orca: Progressive Learning from Complex Explanation Traces of GPT-4. arxiv: 2306.02707 [cs.CL]","author":"Mukherjee Subhabrata","year":"2023","unstructured":"Subhabrata Mukherjee, Arindam Mitra, Ganesh Jawahar, Sahaj Agarwal, Hamid Palangi, and Ahmed Awadallah. 2023. Orca: Progressive Learning from Complex Explanation Traces of GPT-4. arxiv: 2306.02707 [cs.CL]"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/3652583.3657599"},{"key":"e_1_3_2_1_19_1","volume":"201","author":"Paris B.","unstructured":"B. Paris and J. Donovan. 2019. Deepfakes and cheapfakes: The manipulation of audio and visual evidence. https:\/\/datasociety.net\/wp-content\/uploads\/2019\/09\/DataSociety_Deepfakes_Cheap_Fakes.pdf Retrieved April 20, 2024 from","journal-title":"J. Donovan."},{"key":"e_1_3_2_1_20_1","volume-title":"2023 b. Deepfakes and cheapfakes: The manipulation of audio and visual evidence. https:\/\/openai.com\/blog\/gpt-3--5-turbo-fine-tuning-and-api-updates Retrieved","author":"Peng Andrew","year":"2024","unstructured":"Andrew Peng, Michael Wu, John Allard, Logan Kilpatrick, and Steven Heidel. 2023 b. Deepfakes and cheapfakes: The manipulation of audio and visual evidence. https:\/\/openai.com\/blog\/gpt-3--5-turbo-fine-tuning-and-api-updates Retrieved April 20, 2024 from"},{"key":"e_1_3_2_1_21_1","volume-title":"2023 a. Kosmos-2: Grounding multimodal large language models to the world. arXiv preprint arXiv:2306.14824","author":"Peng Zhiliang","year":"2023","unstructured":"Zhiliang Peng, Wenhui Wang, Li Dong, Yaru Hao, Shaohan Huang, Shuming Ma, and Furu Wei. 2023 a. Kosmos-2: Grounding multimodal large language models to the world. arXiv preprint arXiv:2306.14824 (2023)."},{"key":"e_1_3_2_1_22_1","volume-title":"Ookpik-A Collection of Out-of-Context Image-Caption Pairs. In International Conference on Multimedia Modeling. Springer, 132--144","author":"Pham Kha-Luan","year":"2024","unstructured":"Kha-Luan Pham, Minh-Khoi Nguyen-Nhat, Anh-Huy Dinh, Quang-Tri Le, Manh-Thien Nguyen, Anh-Duy Tran, Minh-Triet Tran, and Duc-Tien Dang-Nguyen. 2024 a. Ookpik-A Collection of Out-of-Context Image-Caption Pairs. In International Conference on Multimedia Modeling. Springer, 132--144."},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/3652583.3657597"},{"key":"e_1_3_2_1_24_1","volume-title":"Sdxl: Improving latent diffusion models for high-resolution image synthesis. arXiv preprint arXiv:2307.01952","author":"Podell Dustin","year":"2023","unstructured":"Dustin Podell, Zion English, Kyle Lacey, Andreas Blattmann, Tim Dockhorn, Jonas M\u00fcller, Joe Penna, and Robin Rombach. 2023. Sdxl: Improving latent diffusion models for high-resolution image synthesis. arXiv preprint arXiv:2307.01952 (2023)."},{"key":"e_1_3_2_1_25_1","volume-title":"International conference on machine learning. PMLR, 8748--8763","author":"Radford Alec","year":"2021","unstructured":"Alec Radford, Jong Wook Kim, Chris Hallacy, Aditya Ramesh, Gabriel Goh, Sandhini Agarwal, Girish Sastry, Amanda Askell, Pamela Mishkin, Jack Clark, et al. 2021. Learning transferable visual models from natural language supervision. In International conference on machine learning. PMLR, 8748--8763."},{"key":"e_1_3_2_1_26_1","volume-title":"Photo of burning house. https:\/\/unsplash.com\/photos\/photo-of-burning-house-hLUTRzcVkqg Retrieved","author":"Radford Stephen","year":"2024","unstructured":"Stephen Radford. 2015. Photo of burning house. https:\/\/unsplash.com\/photos\/photo-of-burning-house-hLUTRzcVkqg Retrieved April 20, 2024 from"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1410"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"crossref","unstructured":"A. R\u00f6ssler D. Cozzolino L. Verdoliva C. Riess J. Thies and M. Nie\u00dfner. 2019. FaceForensics: Learning to Detect Manipulated Facial Images. arxiv: 1901.08971 [cs.CV]","DOI":"10.1109\/ICCV.2019.00009"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P16-1162"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1145\/3652583.3657601"},{"key":"e_1_3_2_1_32_1","volume-title":"Woman in Viral Photo Misidentified as Rep. Omar. https:\/\/www.factcheck.org\/2019\/09\/woman-in-viral-photo-misidentified-as-rep-omar\/ Retrieved","author":"Spencer Saranac Hale","year":"2024","unstructured":"Saranac Hale Spencer. 2019. Woman in Viral Photo Misidentified as Rep. Omar. https:\/\/www.factcheck.org\/2019\/09\/woman-in-viral-photo-misidentified-as-rep-omar\/ Retrieved April 20, 2024 from"},{"key":"e_1_3_2_1_33_1","volume-title":"https:\/\/unsplash.com\/photos\/gray-bridge-lzcDi7-MWL4 Retrieved","author":"Stern Ozzie","year":"2024","unstructured":"Ozzie Stern. 2019. Gray Bridge. https:\/\/unsplash.com\/photos\/gray-bridge-lzcDi7-MWL4 Retrieved April 20, 2024 from"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1145\/3652583.3657596"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1145\/3652583.3657600"},{"key":"e_1_3_2_1_36_1","volume-title":"International Conference on Machine Learning. PMLR, 23318--23340","author":"Wang Peng","year":"2022","unstructured":"Peng Wang, An Yang, Rui Men, Junyang Lin, Shuai Bai, Zhikang Li, Jianxin Ma, Chang Zhou, Jingren Zhou, and Hongxia Yang. 2022. Ofa: Unifying architectures, tasks, and modalities through a simple sequence-to-sequence learning framework. In International Conference on Machine Learning. PMLR, 23318--23340."},{"key":"e_1_3_2_1_37_1","unstructured":"J. Waterson. 2019. Facebook refuses to delete fake Pelosi video spread by Trump supporters. https:\/\/www.theguardian.com\/technology\/2019\/may\/24\/facebook-leaves-fake-nancy-pelosi-video-on-site Retrieved April 20 2024 from https:\/\/www.theguardian.com\/technology\/2019\/may\/24\/facebook-leaves-fake-nancy-pelosi-video-on-site"}],"event":{"name":"ICMR '24: International Conference on Multimedia Retrieval","location":"Phuket Thailand","acronym":"ICMR '24","sponsor":["SIGMM ACM Special Interest Group on Multimedia","SIGSOFT ACM Special Interest Group on Software Engineering"]},"container-title":["Proceedings of the 2024 International Conference on Multimedia Retrieval"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3652583.3657587","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3652583.3657587","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,21]],"date-time":"2025-08-21T08:50:28Z","timestamp":1755766228000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3652583.3657587"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,5,30]]},"references-count":37,"alternative-id":["10.1145\/3652583.3657587","10.1145\/3652583"],"URL":"https:\/\/doi.org\/10.1145\/3652583.3657587","relation":{},"subject":[],"published":{"date-parts":[[2024,5,30]]},"assertion":[{"value":"2024-06-07","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}