{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,22]],"date-time":"2026-05-22T03:05:18Z","timestamp":1779419118512,"version":"3.53.1"},"publisher-location":"Singapore","reference-count":27,"publisher":"Springer Nature Singapore","isbn-type":[{"value":"9789819500086","type":"print"},{"value":"9789819500093","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-981-95-0009-3_31","type":"book-chapter","created":{"date-parts":[[2025,7,24]],"date-time":"2025-07-24T13:25:04Z","timestamp":1753363504000},"page":"362-373","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["DDformer: Deepfake Detection with Multimodal Fusion Transformer"],"prefix":"10.1007","author":[{"given":"Jiazhan","family":"Gao","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Deqi","family":"Huang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jinlai","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Eksan","family":"Firkat","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Chao","family":"Liu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jihong","family":"Zhu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2025,7,25]]},"reference":[{"key":"31_CR1","unstructured":"Goodfellow, I., et al.: Generative adversarial nets. In: Advances in Neural Information Processing Systems, vol. 27 (2014)"},{"key":"31_CR2","unstructured":"deepfakes: faceswap. GitHub repository (2019). https:\/\/github.com\/deepfakes\/faceswap"},{"key":"31_CR3","doi-asserted-by":"publisher","first-page":"120646","DOI":"10.1016\/j.eswa.2023.120646","volume":"231","author":"Y Li","year":"2023","unstructured":"Li, Y., Bian, S., Wang, C., Polat, K., Alhudhaif, A., Alenezi, F.: Exposing low-quality deepfake videos of social network service using spatial restored detection framework. Expert Syst. Appl. 231, 120646 (2023)","journal-title":"Expert Syst. Appl."},{"issue":"09","key":"31_CR4","doi-asserted-by":"publisher","first-page":"2350015","DOI":"10.1142\/S0218001423500155","volume":"37","author":"HC Chang","year":"2023","unstructured":"Chang, H.C.: Deepfake speech recognition and detection. Int. J. Pattern Recognit Artif Intell. 37(09), 2350015 (2023)","journal-title":"Int. J. Pattern Recognit Artif Intell."},{"key":"31_CR5","unstructured":"Blue, L., et al.: Who are you (i really wanna know)? Detecting audio DeepFakes through vocal tract reconstruction. In: 31st USENIX Security Symposium (USENIX Security 2022), pp. 2691\u20132708 (2022)"},{"key":"31_CR6","doi-asserted-by":"publisher","first-page":"2078","DOI":"10.1109\/LSP.2022.3205562","volume":"29","author":"B Chu","year":"2022","unstructured":"Chu, B., You, W., Yang, Z., Zhou, L., Wang, R.: Protecting world leader using facial speaking pattern against deepfakes. IEEE Signal Process. Lett. 29, 2078\u20132082 (2022)","journal-title":"IEEE Signal Process. Lett."},{"key":"31_CR7","doi-asserted-by":"publisher","first-page":"118423","DOI":"10.1016\/j.eswa.2022.118423","volume":"210","author":"S Ganguly","year":"2022","unstructured":"Ganguly, S., Ganguly, A., Mohiuddin, S., Malakar, S., Sarkar, R.: Vixnet: vision transformer with xception network for deepfakes based video and image forgery detection. Expert Syst. Appl. 210, 118423 (2022)","journal-title":"Expert Syst. Appl."},{"key":"31_CR8","doi-asserted-by":"crossref","unstructured":"Tian, K., Chen, C., Zhou, Y., Hu, X.: Illumination enlightened spatial-temporal inconsistency for deepfake video detection. In: 2024 IEEE International Conference on Multimedia and Expo (ICME), p.6. IEEE (2024)","DOI":"10.1109\/ICME57554.2024.10687905"},{"key":"31_CR9","doi-asserted-by":"crossref","unstructured":"Guarnera, L., Giudice, O., Battiato, S.: Deepfake detection by analyzing convolutional traces. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops, pp. 666\u2013667 (2020)","DOI":"10.1109\/CVPRW50498.2020.00341"},{"key":"31_CR10","doi-asserted-by":"crossref","unstructured":"Li, L., et al.: Face x-ray for more general face forgery detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5001\u20135010 (2020)","DOI":"10.1109\/CVPR42600.2020.00505"},{"issue":"10","key":"31_CR11","doi-asserted-by":"publisher","first-page":"6111","DOI":"10.1109\/TPAMI.2021.3093446","volume":"44","author":"Y Nirkin","year":"2021","unstructured":"Nirkin, Y., Wolf, L., Keller, Y., Hassner, T.: Deepfake detection based on discrepancies between faces and their context. IEEE Trans. Pattern Anal. Mach. Intell. 44(10), 6111\u20136121 (2021)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"31_CR12","doi-asserted-by":"crossref","unstructured":"Zhao, H., Zhou, W., Chen, D., Wei, T., Zhang, W., Yu, N.: Multi-attentional deepfake detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 2185\u20132194 (2021)","DOI":"10.1109\/CVPR46437.2021.00222"},{"key":"31_CR13","doi-asserted-by":"crossref","unstructured":"Wang, Y., Yu, K., Chen, C., Hu, X., Peng, S.: Dynamic graph learning with content-guided spatial-frequency relation reasoning for deepfake detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7278\u20137287 (2023)","DOI":"10.1109\/CVPR52729.2023.00703"},{"key":"31_CR14","doi-asserted-by":"crossref","unstructured":"Guera, D., Delp, E.J.: Deepfake video detection using recurrent neural networks. In: 2018 15th IEEE International Conference on Advanced Video and Signal Based Surveillance (AVSS), pp. 1\u20136. IEEE (2018)","DOI":"10.1109\/AVSS.2018.8639163"},{"key":"31_CR15","doi-asserted-by":"crossref","unstructured":"Montserrat, D.M., et al.: Deepfakes detection with automatic face weighting. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops, pp. 668\u2013669 (2020)","DOI":"10.1109\/CVPRW50498.2020.00342"},{"key":"31_CR16","doi-asserted-by":"crossref","unstructured":"Ashok, V., Joy, P.T.: Deepfake detection using xceptionnet. In: 2023 IEEE International Conference on Recent Advances in Systems Science and Engineering (RASSE), pp. 1\u20135 (2023)","DOI":"10.1109\/RASSE60029.2023.10363477"},{"key":"31_CR17","doi-asserted-by":"crossref","unstructured":"Raza, M.A., Malik, K.M.: Multimodaltrace: deepfake detection using audiovisual representation learning. In: 2023 IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops (CVPRW), pp. 993\u20131000 (2023)","DOI":"10.1109\/CVPRW59228.2023.00106"},{"key":"31_CR18","doi-asserted-by":"publisher","first-page":"583","DOI":"10.1016\/j.neucom.2022.06.013","volume":"501","author":"M Yu","year":"2022","unstructured":"Yu, M., Ju, S., Zhang, J., Li, S., Lei, J., Li, X.: Patch-DFD: patch-based end-to-end deepfake discriminator. Neurocomputing 501, 583\u2013595 (2022)","journal-title":"Neurocomputing"},{"key":"31_CR19","doi-asserted-by":"crossref","unstructured":"Oorloff, T., et al.: AVFF: audio-visual feature fusion for video deepfake detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 27102\u201327112 (2024)","DOI":"10.1109\/CVPR52733.2024.02559"},{"key":"31_CR20","doi-asserted-by":"crossref","unstructured":"Zhou, Y., Lim, S.N.: Joint audio-visual deepfake detection. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 14800\u201314809 (2021)","DOI":"10.1109\/ICCV48922.2021.01453"},{"key":"31_CR21","doi-asserted-by":"crossref","unstructured":"Oorloff, T., et al.: AVFF: audio-visual feature fusion for video deepfake detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 27102\u201327112 (2024)","DOI":"10.1109\/CVPR52733.2024.02559"},{"issue":"5","key":"31_CR22","first-page":"1","volume":"20","author":"Y Zhang","year":"2024","unstructured":"Zhang, Y., Lin, W., Xu, J.: Joint audio-visual attention with contrastive learning for more general deepfake detection. ACM Trans. Multimed. Comput. Commun. Appl. 20(5), 1\u201323 (2024)","journal-title":"ACM Trans. Multimed. Comput. Commun. Appl."},{"key":"31_CR23","doi-asserted-by":"publisher","first-page":"2015","DOI":"10.1109\/TIFS.2023.3262148","volume":"18","author":"W Yang","year":"2023","unstructured":"Yang, W., et al.: AVoiD-DF: audio-visual joint learning for detecting deepfake. IEEE Trans. Inf. Forensics Secur. 18, 2015\u20132029 (2023)","journal-title":"IEEE Trans. Inf. Forensics Secur."},{"issue":"3","key":"31_CR24","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3625231","volume":"20","author":"H Cheng","year":"2023","unstructured":"Cheng, H., Guo, Y., Wang, T., Li, Q., Chang, X., Nie, L.: Voice-face homogeneity tells deepfake. ACM Trans. Multimed. Comput. Commun. Appl. 20(3), 1\u201322 (2023)","journal-title":"ACM Trans. Multimed. Comput. Commun. Appl."},{"key":"31_CR25","doi-asserted-by":"publisher","first-page":"110124","DOI":"10.1016\/j.asoc.2023.110124","volume":"136","author":"H Ilyas","year":"2023","unstructured":"Ilyas, H., Javed, A., Malik, K.M.: Avfakenet: a unified end-to-end dense swin transformer deep learning model for audio\u2013visual deepfakes detection. Appl. Soft Comput. 136, 110124 (2023)","journal-title":"Appl. Soft Comput."},{"key":"31_CR26","unstructured":"Vaswani, A., et al.: Attention is all you need. In: Advances in Neural Information Processing Systems, vol. 30 (2017)"},{"key":"31_CR27","unstructured":"Khalid, H., Tariq, S., Kim, M., Woo, S.S.: FakeAVCeleb: a novel audio-video multimodal deepfake dataset. arXiv preprint arXiv:2108.05080 (2021)"}],"container-title":["Lecture Notes in Computer Science","Advanced Intelligent Computing Technology and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-95-0009-3_31","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,22]],"date-time":"2026-05-22T02:21:54Z","timestamp":1779416514000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-95-0009-3_31"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9789819500086","9789819500093"],"references-count":27,"URL":"https:\/\/doi.org\/10.1007\/978-981-95-0009-3_31","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"25 July 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Disclosure of Interests"}},{"value":"ICIC","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Intelligent Computing","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Ningbo","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"China","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26 July 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 July 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"21","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"icic2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.ic-icc.cn\/icg\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}