{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,5,31]],"date-time":"2025-05-31T04:09:23Z","timestamp":1748664563596,"version":"3.41.0"},"publisher-location":"Cham","reference-count":84,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031926471","type":"print"},{"value":"9783031926488","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-92648-8_19","type":"book-chapter","created":{"date-parts":[[2025,5,30]],"date-time":"2025-05-30T16:29:07Z","timestamp":1748622547000},"page":"316-332","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Detect Fake with\u00a0Fake: Leveraging Synthetic Data-Driven Representation for\u00a0Synthetic Image Detection"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0000-3382-3079","authenticated-orcid":false,"given":"Hina","family":"Otake","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8892-5339","authenticated-orcid":false,"given":"Yoshihiro","family":"Fukuhara","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5448-7828","authenticated-orcid":false,"given":"Yoshiki","family":"Kubotani","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8859-6539","authenticated-orcid":false,"given":"Shigeo","family":"Morishima","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,5,12]]},"reference":[{"key":"19_CR1","doi-asserted-by":"crossref","unstructured":"Agarwal, S., Farid, H.: Photo forensics from jpeg dimples. In: 2017 IEEE Workshop on Information Forensics and Security (WIFS), pp.\u00a01\u20136. IEEE (2017)","DOI":"10.1109\/WIFS.2017.8267641"},{"key":"19_CR2","doi-asserted-by":"crossref","unstructured":"Azizpour, A., Nguyen, T.D., Shrestha, M., Xu, K., Kim, E., Stamm, M.C.: E3: ensemble of expert embedders for adapting synthetic image detectors to new generators using limited data. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4334\u20134344 (2024)","DOI":"10.1109\/CVPRW63382.2024.00437"},{"key":"19_CR3","unstructured":"Bachmann, R., et al.: 4M-21: an any-to-any vision model for tens of tasks and modalities. arXiv 2024 (2024)"},{"key":"19_CR4","unstructured":"Baradad, M., et al.: Procedural image programs for representation learning. In: Oh, A.H., Agarwal, A., Belgrave, D., Cho, K. (eds.) Advances in Neural Information Processing Systems (2022). https:\/\/openreview.net\/forum?id=wJwHTgIoE0P"},{"key":"19_CR5","unstructured":"Baradad, M., Wulff, J., Wang, T., Isola, P., Torralba, A.: Learning to see by looking at noise. In: Advances in Neural Information Processing Systems (2021)"},{"key":"19_CR6","unstructured":"Brock, A., Donahue, J., Simonyan, K.: Large scale GAN training for high fidelity natural image synthesis. arXiv preprint arXiv:1809.11096 (2018)"},{"key":"19_CR7","doi-asserted-by":"crossref","unstructured":"Cardenuto, J.P., et\u00a0al.: The age of synthetic realities: challenges and opportunities. APSIPA Trans. Signal Inf. Process. 12(1) (2023)","DOI":"10.1561\/116.00000138"},{"key":"19_CR8","doi-asserted-by":"crossref","unstructured":"Caron, M., et al.: Emerging properties in self-supervised vision transformers. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 9650\u20139660 (2021)","DOI":"10.1109\/ICCV48922.2021.00951"},{"key":"19_CR9","doi-asserted-by":"crossref","unstructured":"Chen, C., Chen, Q., Xu, J., Koltun, V.: Learning to see in the dark. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3291\u20133300 (2018)","DOI":"10.1109\/CVPR.2018.00347"},{"key":"19_CR10","doi-asserted-by":"crossref","unstructured":"Chen, L., Zhang, Y., Song, Y., Liu, L., Wang, J.: Self-supervised learning of adversarial example: towards good generalizations for deepfake detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 18710\u201318719 (2022)","DOI":"10.1109\/CVPR52688.2022.01815"},{"key":"19_CR11","doi-asserted-by":"crossref","unstructured":"Chen, Q., Koltun, V.: Photographic image synthesis with cascaded refinement networks. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1511\u20131520 (2017)","DOI":"10.1109\/ICCV.2017.168"},{"key":"19_CR12","doi-asserted-by":"crossref","unstructured":"Chen, R., Chen, X., Ni, B., Ge, Y.: Simswap: an efficient framework for high fidelity face swapping. In: Proceedings of the 28th ACM International Conference on Multimedia, pp. 2003\u20132011 (2020)","DOI":"10.1145\/3394171.3413630"},{"key":"19_CR13","doi-asserted-by":"crossref","unstructured":"Choi, Y., Choi, M., Kim, M., Ha, J.W., Kim, S., Choo, J.: Stargan: unified generative adversarial networks for multi-domain image-to-image translation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2018)","DOI":"10.1109\/CVPR.2018.00916"},{"key":"19_CR14","doi-asserted-by":"crossref","unstructured":"Choi, Y., Uh, Y., Yoo, J., Ha, J.W.: Stargan v2: diverse image synthesis for multiple domains. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 8188\u20138197 (2020)","DOI":"10.1109\/CVPR42600.2020.00821"},{"key":"19_CR15","doi-asserted-by":"crossref","unstructured":"Cozzolino, D., Poggi, G., Corvi, R., Nie\u00dfner, M., Verdoliva, L.: Raising the bar of AI-generated image detection with clip. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4356\u20134366 (2024)","DOI":"10.1109\/CVPRW63382.2024.00439"},{"key":"19_CR16","unstructured":"Cozzolino, D., Thies, J., R\u00f6ssler, A., Riess, C., Nie\u00dfner, M., Verdoliva, L.: Forensictransfer: weakly-supervised domain adaptation for forgery detection. arXiv preprint arXiv:1812.02510 (2018)"},{"key":"19_CR17","doi-asserted-by":"crossref","unstructured":"Dai, T., Cai, J., Zhang, Y., Xia, S.T., Zhang, L.: Second-order attention network for single image super-resolution. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 11065\u201311074 (2019)","DOI":"10.1109\/CVPR.2019.01132"},{"key":"19_CR18","unstructured":"Darcet, T., Oquab, M., Mairal, J., Bojanowski, P.: Vision transformers need registers. arXiv preprint arXiv:2309.16588 (2023)"},{"key":"19_CR19","first-page":"8780","volume":"34","author":"P Dhariwal","year":"2021","unstructured":"Dhariwal, P., Nichol, A.: Diffusion models beat GANs on image synthesis. Adv. Neural. Inf. Process. Syst. 34, 8780\u20138794 (2021)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"19_CR20","unstructured":"Dosovitskiy, A., et al.: An image is worth 16x16 words: transformers for image recognition at scale. arXiv preprint arXiv:2010.11929 (2020)"},{"key":"19_CR21","doi-asserted-by":"publisher","unstructured":"Essa, E.: Feature fusion vision transformers using MLP-mixer for enhanced deepfake detection. Neurocomputing 128128 (2024). https:\/\/doi.org\/10.1016\/j.neucom.2024.128128. https:\/\/www.sciencedirect.com\/science\/article\/pii\/S0925231224008993","DOI":"10.1016\/j.neucom.2024.128128"},{"key":"19_CR22","doi-asserted-by":"crossref","unstructured":"Fan, L., Chen, K., Krishnan, D., Katabi, D., Isola, P., Tian, Y.: Scaling laws of synthetic images for model training ... for now. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 7382\u20137392 (2024)","DOI":"10.1109\/CVPR52733.2024.00705"},{"key":"19_CR23","unstructured":"Frank, J., Eisenhofer, T., Sch\u00f6nherr, L., Fischer, A., Kolossa, D., Holz, T.: Leveraging frequency analysis for deep fake image recognition. In: International Conference on Machine Learning, pp. 3247\u20133258. PMLR (2020)"},{"key":"19_CR24","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"19_CR25","doi-asserted-by":"crossref","unstructured":"Hl, D.S., Thomas, S.M., et\u00a0al.: A multimodal approach integrating convolutional and recurrent neural networks for Alzheimer\u2019s disease temporal progression prediction. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5207\u20135215 (2024)","DOI":"10.1109\/CVPRW63382.2024.00529"},{"key":"19_CR26","doi-asserted-by":"publisher","unstructured":"Ilharco, G., et al.: Openclip (2021). https:\/\/doi.org\/10.5281\/zenodo.5143773","DOI":"10.5281\/zenodo.5143773"},{"key":"19_CR27","doi-asserted-by":"crossref","unstructured":"Kang, M., et al.: Scaling up GANs for text-to-image synthesis. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2023)","DOI":"10.1109\/CVPR52729.2023.00976"},{"key":"19_CR28","unstructured":"Karras, T., Aila, T., Laine, S., Lehtinen, J.: Progressive growing of GANs for improved quality, stability, and variation. arXiv preprint arXiv:1710.10196 (2017)"},{"key":"19_CR29","doi-asserted-by":"crossref","unstructured":"Karras, T., Laine, S., Aila, T.: A style-based generator architecture for generative adversarial networks. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4401\u20134410 (2019)","DOI":"10.1109\/CVPR.2019.00453"},{"key":"19_CR30","doi-asserted-by":"crossref","unstructured":"Karras, T., Laine, S., Aittala, M., Hellsten, J., Lehtinen, J., Aila, T.: Analyzing and improving the image quality of stylegan. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 8110\u20138119 (2020)","DOI":"10.1109\/CVPR42600.2020.00813"},{"key":"19_CR31","doi-asserted-by":"publisher","unstructured":"Kataoka, H., et al.: Replacing labeled real-image datasets with auto-generated contours. In: 2022 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 21200\u201321209 (2022). https:\/\/doi.org\/10.1109\/CVPR52688.2022.02055","DOI":"10.1109\/CVPR52688.2022.02055"},{"key":"19_CR32","doi-asserted-by":"crossref","unstructured":"Kataoka, H., et al.: Pre-training without natural images. In: Asian Conference on Computer Vision (ACCV) (2020)","DOI":"10.1007\/978-3-030-69544-6_35"},{"key":"19_CR33","doi-asserted-by":"crossref","unstructured":"Koutlis, C., Papadopoulos, S.: Leveraging representations from intermediate encoder-blocks for synthetic image detection. arXiv preprint arXiv:2402.19091 (2024)","DOI":"10.1007\/978-3-031-73220-1_23"},{"key":"19_CR34","doi-asserted-by":"crossref","unstructured":"Li, K., Zhang, T., Malik, J.: Diverse image synthesis from semantic layouts via conditional IMLE. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 4220\u20134229 (2019)","DOI":"10.1109\/ICCV.2019.00432"},{"key":"19_CR35","unstructured":"Li, L., Bao, J., Yang, H., Chen, D., Wen, F.: Faceshifter: towards high fidelity and occlusion aware face swapping. arXiv preprint arXiv:1912.13457 (2019)"},{"key":"19_CR36","doi-asserted-by":"crossref","unstructured":"Lin, L., et al.: Detecting multimedia generated by large AI models: a survey. arXiv preprint arXiv:2402.00045 (2024)","DOI":"10.36227\/techrxiv.170723324.44685515\/v1"},{"issue":"4","key":"19_CR37","doi-asserted-by":"publisher","first-page":"598","DOI":"10.1109\/83.913594","volume":"10","author":"C Liu","year":"2001","unstructured":"Liu, C., Wechsler, H.: A shape-and texture-based enhanced fisher classifier for face recognition. IEEE Trans. Image Process. 10(4), 598\u2013608 (2001)","journal-title":"IEEE Trans. Image Process."},{"key":"19_CR38","doi-asserted-by":"crossref","unstructured":"Liu, H., Tan, Z., Tan, C., Wei, Y., Wang, J., Zhao, Y.: Forgery-aware adaptive transformer for generalizable synthetic image detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10770\u201310780 (2024)","DOI":"10.1109\/CVPR52733.2024.01024"},{"key":"19_CR39","unstructured":"Liu, Z., Wang, H., Kang, Y., Wang, S.: Mixture of low-rank experts for transferable AI-generated image detection. arXiv preprint arXiv:2404.04883 (2024)"},{"key":"19_CR40","doi-asserted-by":"crossref","unstructured":"Luo, A., Kong, C., Huang, J., Hu, Y., Kang, X., Kot, A.C.: Beyond the prior forgery knowledge: mining critical clues for general face forgery detection (2023)","DOI":"10.1109\/TIFS.2023.3332218"},{"key":"19_CR41","doi-asserted-by":"crossref","unstructured":"Marra, F., Gragnaniello, D., Cozzolino, D., Verdoliva, L.: Detection of GAN-generated fake images over social networks. In: 2018 IEEE Conference on Multimedia Information Processing and Retrieval (MIPR), pp. 384\u2013389. IEEE (2018)","DOI":"10.1109\/MIPR.2018.00084"},{"key":"19_CR42","doi-asserted-by":"publisher","unstructured":"Marra, F., Gragnaniello, D., Verdoliva, L., Poggi, G.: Do GANs leave artificial fingerprints? In: 2019 IEEE Conference on Multimedia Information Processing and Retrieval (MIPR), pp. 506\u2013511 (2019). https:\/\/doi.org\/10.1109\/MIPR.2019.00103","DOI":"10.1109\/MIPR.2019.00103"},{"key":"19_CR43","doi-asserted-by":"crossref","unstructured":"McInnes, L., Healy, J., Melville, J.: UMAP: uniform manifold approximation and projection for dimension reduction. arXiv preprint arXiv:1802.03426 (2018)","DOI":"10.21105\/joss.00861"},{"key":"19_CR44","unstructured":"Midjourney, I.: Malicious actors manipulating photos and videos to create explicit content and sextortion schemes. https:\/\/www.midjourney.com\/ (2022)"},{"key":"19_CR45","unstructured":"Mizrahi, D., et al.: 4M: massively multimodal masked modeling. In: Thirty-Seventh Conference on Neural Information Processing Systems (2023)"},{"key":"19_CR46","doi-asserted-by":"publisher","unstructured":"Nakashima, K., Kataoka, H., Matsumoto, A., Iwata, K., Inoue, N., Satoh, Y.: Can vision transformers learn without natural images? In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 36, no. 2, pp. 1990\u20131998 (2022). https:\/\/doi.org\/10.1609\/aaai.v36i2.20094. https:\/\/ojs.aaai.org\/index.php\/AAAI\/article\/view\/20094","DOI":"10.1609\/aaai.v36i2.20094"},{"key":"19_CR47","doi-asserted-by":"crossref","unstructured":"Nguyen, H.H., Yamagishi, J., Echizen, I.: Exploring self-supervised vision transformers for deepfake detection: a comparative analysis. arXiv preprint arXiv:2405.00355 (2024)","DOI":"10.1109\/IJCB62174.2024.10744497"},{"key":"19_CR48","unstructured":"Nichol, A., et al.: Glide: towards photorealistic image generation and editing with text-guided diffusion models. arXiv preprint arXiv:2112.10741 (2021)"},{"key":"19_CR49","doi-asserted-by":"crossref","unstructured":"Nirkin, Y., Keller, Y., Hassner, T.: Fsgan: subject agnostic face swapping and reenactment. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 7184\u20137193 (2019)","DOI":"10.1109\/ICCV.2019.00728"},{"key":"19_CR50","doi-asserted-by":"publisher","unstructured":"O\u2019Brien, J.F., Farid, H.: Exposing photo manipulation with inconsistent reflections. ACM Trans. Graph. 31(1) (2012). https:\/\/doi.org\/10.1145\/2077341.2077345","DOI":"10.1145\/2077341.2077345"},{"key":"19_CR51","doi-asserted-by":"crossref","unstructured":"Ojha, U., Li, Y., Lee, Y.J.: Towards universal fake image detectors that generalize across generative models. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 24480\u201324489 (2023)","DOI":"10.1109\/CVPR52729.2023.02345"},{"key":"19_CR52","unstructured":"van\u00a0den Oord, A., Vinyals, O., Kavukcuoglu, K.: Neural discrete representation learning (2018)"},{"key":"19_CR53","unstructured":"OpenAI: Dall$$\\cdot $$e 3 system card (2023). https:\/\/openai.com\/research\/dall-e-3-system-card"},{"key":"19_CR54","unstructured":"Oquab, M., et al.: Dinov2: learning robust visual features without supervision (2023)"},{"key":"19_CR55","doi-asserted-by":"crossref","unstructured":"Park, T., Liu, M.Y., Wang, T.C., Zhu, J.Y.: Semantic image synthesis with spatially-adaptive normalization. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 2337\u20132346 (2019)","DOI":"10.1109\/CVPR.2019.00244"},{"issue":"2","key":"19_CR56","doi-asserted-by":"publisher","first-page":"758","DOI":"10.1109\/TSP.2004.839932","volume":"53","author":"AC Popescu","year":"2005","unstructured":"Popescu, A.C., Farid, H.: Exposing digital forgeries by detecting traces of resampling. IEEE Trans. Signal Process. 53(2), 758\u2013767 (2005)","journal-title":"IEEE Trans. Signal Process."},{"key":"19_CR57","doi-asserted-by":"crossref","unstructured":"Pumarola, A., Agudo, A., Martinez, A.M., Sanfeliu, A., Moreno-Noguer, F.: Ganimation: anatomically-aware facial animation from a single image. In: Proceedings of the European Conference on Computer Vision (ECCV) (2018)","DOI":"10.1007\/978-3-030-01249-6_50"},{"key":"19_CR58","unstructured":"Radford, A., et\u00a0al.: Learning transferable visual models from natural language supervision. In: International Conference on Machine Learning, pp. 8748\u20138763. PMLR (2021)"},{"key":"19_CR59","unstructured":"Ramesh, A., Dhariwal, P., Nichol, A., Chu, C., Chen, M.: Hierarchical text-conditional image generation with clip latents. arXiv:2204.061251(2), 3 (2022)"},{"key":"19_CR60","unstructured":"Ramesh, A., et al.: Zero-shot text-to-image generation. In: International Conference on Machine Learning, pp. 8821\u20138831. PMLR (2021)"},{"key":"19_CR61","unstructured":"Razavi, A., van\u00a0den Oord, A., Vinyals, O.: Generating diverse high-fidelity images with VQ-VAE-2 (2019)"},{"key":"19_CR62","doi-asserted-by":"crossref","unstructured":"Rombach, R., Blattmann, A., Lorenz, D., Esser, P., Ommer, B.: High-resolution image synthesis with latent diffusion models. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 10684\u201310695 (2022)","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"19_CR63","doi-asserted-by":"crossref","unstructured":"Rombach, R., Blattmann, A., Lorenz, D., Esser, P., Ommer, B.: High-resolution image synthesis with latent diffusion models. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10684\u201310695 (2022)","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"19_CR64","doi-asserted-by":"crossref","unstructured":"Rossler, A., Cozzolino, D., Verdoliva, L., Riess, C., Thies, J., Nie\u00dfner, M.: Faceforensics++: learning to detect manipulated facial images. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 1\u201311 (2019)","DOI":"10.1109\/ICCV.2019.00009"},{"key":"19_CR65","unstructured":"Saharia, C., et al.: Photorealistic text-to-image diffusion models with deep language understanding (2022)"},{"key":"19_CR66","unstructured":"Schuhmann, C., et al.: Laion-5b: an open large-scale dataset for training next generation image-text models. In: Koyejo, S., Mohamed, S., Agarwal, A., Belgrave, D., Cho, K., Oh, A. (eds.) Advances in Neural Information Processing Systems, vol.\u00a035, pp. 25278\u201325294. Curran Associates, Inc. (2022). https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2022\/file\/a1859debfb3b59d094f3504d5ebb6c25-Paper-Datasets_and_Benchmarks.pdf"},{"key":"19_CR67","unstructured":"Schuhmann, C., et al.: Laion-400m: open dataset of clip-filtered 400 million image-text pairs. arXiv preprint arXiv:2111.02114 (2021)"},{"key":"19_CR68","unstructured":"Shahid, S.M., Padhi, S.K., Kashyap, U., Ali, S.S.: Generalized deepfake attribution. arXiv preprint arXiv:2406.18278 (2024)"},{"key":"19_CR69","doi-asserted-by":"crossref","unstructured":"Shiohara, K., Yamasaki, T.: Detecting deepfakes with self-blended images. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 18720\u201318729 (2022)","DOI":"10.1109\/CVPR52688.2022.01816"},{"key":"19_CR70","doi-asserted-by":"crossref","unstructured":"Singh, K., Navaratnam, T., Holmer, J., Schaub-Meyer, S., Roth, S.: Is synthetic data all we need? Benchmarking the robustness of models trained with synthetic images. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops, pp. 2505\u20132515 (2024)","DOI":"10.1109\/CVPRW63382.2024.00257"},{"key":"19_CR71","doi-asserted-by":"crossref","unstructured":"Takashima, S., Hayamizu, R., Inoue, N., Kataoka, H., Yokota, R.: Visual atoms: pre-training vision transformers with sinusoidal waves. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 18579\u201318588 (2023)","DOI":"10.1109\/CVPR52729.2023.01782"},{"issue":"12","key":"19_CR72","doi-asserted-by":"publisher","first-page":"2437","DOI":"10.1016\/j.patcog.2004.12.013","volume":"38","author":"QS Sun","year":"2005","unstructured":"Sun, Q.S., Zeng, S.G., Liu, Y., Heng, P.A., Xia, D.S.: A new method of feature fusion and its application in image recognition. Pattern Recogn. 38(12), 2437\u20132448 (2005)","journal-title":"Pattern Recogn."},{"key":"19_CR73","doi-asserted-by":"crossref","unstructured":"Tan, C., Zhao, Y., Wei, S., Gu, G., Liu, P., Wei, Y.: Rethinking the up-sampling operations in CNN-based generative network for generalizable deepfake detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 28130\u201328139 (2024)","DOI":"10.1109\/CVPR52733.2024.02657"},{"key":"19_CR74","doi-asserted-by":"crossref","unstructured":"Tan, C., Zhao, Y., Wei, S., Gu, G., Wei, Y.: Learning on gradients: generalized artifacts representation for GAN-generated images detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 12105\u201312114 (2023)","DOI":"10.1109\/CVPR52729.2023.01165"},{"key":"19_CR75","doi-asserted-by":"crossref","unstructured":"Thies, J., Zollhofer, M., Stamminger, M., Theobalt, C., Nie\u00dfner, M.: Face2face: real-time face capture and reenactment of RGB videos. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2387\u20132395 (2016)","DOI":"10.1109\/CVPR.2016.262"},{"key":"19_CR76","doi-asserted-by":"crossref","unstructured":"Tian, Y., Fan, L., Chen, K., Katabi, D., Krishnan, D., Isola, P.: Learning vision from models rivals learning vision from data. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 15887\u201315898 (2024)","DOI":"10.1109\/CVPR52733.2024.01504"},{"key":"19_CR77","unstructured":"Tian, Y., Fan, L., Isola, P., Chang, H., Krishnan, D.: Stablerep: synthetic images from text-to-image models make strong visual representation learners. In: Oh, A., Naumann, T., Globerson, A., Saenko, K., Hardt, M., Levine, S. (eds.) Advances in Neural Information Processing Systems, vol.\u00a036, pp. 48382\u201348402. Curran Associates, Inc. (2023). https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2023\/file\/971f1e59cd956cc094da4e2f78c6ea7c-Paper-Conference.pdf"},{"key":"19_CR78","doi-asserted-by":"publisher","DOI":"10.1016\/j.compbiomed.2022.105901","volume":"148","author":"Y Tu","year":"2022","unstructured":"Tu, Y., Lin, S., Qiao, J., Zhuang, Y., Zhang, P.: Alzheimer\u2019s disease diagnosis via multimodal feature fusion. Comput. Biol. Med. 148, 105901 (2022)","journal-title":"Comput. Biol. Med."},{"key":"19_CR79","doi-asserted-by":"crossref","unstructured":"Wang, S.Y., Wang, O., Zhang, R., Owens, F., Efros, A.A.: CNN-generated images are surprisingly easy to spot... for now. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 8695\u20138704 (2020)","DOI":"10.1109\/CVPR42600.2020.00872"},{"key":"19_CR80","doi-asserted-by":"crossref","unstructured":"Xu, Z., et al.: Styleswap: style-based generator empowers robust face swapping. In: European Conference on Computer Vision, pp. 661\u2013677. Springer (2022)","DOI":"10.1007\/978-3-031-19781-9_38"},{"key":"19_CR81","doi-asserted-by":"crossref","unstructured":"Yan, Z., Luo, Y., Lyu, S., Liu, Q., Wu, B.: Transcending forgery specificity with latent space augmentation for generalizable deepfake detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 8984\u20138994 (2024)","DOI":"10.1109\/CVPR52733.2024.00858"},{"key":"19_CR82","doi-asserted-by":"crossref","unstructured":"Yu, N., Davis, L., Fritz, M.: Attributing fake images to GANs: learning and analyzing GAN fingerprints. In: IEEE International Conference on Computer Vision (ICCV) (2019)","DOI":"10.1109\/ICCV.2019.00765"},{"key":"19_CR83","doi-asserted-by":"crossref","unstructured":"Zhang, X., Karaman, S., Chang, S.F.: Detecting and simulating artifacts in GAN fake images. In: 2019 IEEE International Workshop on Information Forensics and Security (WIFS), pp.\u00a01\u20136. IEEE (2019)","DOI":"10.1109\/WIFS47025.2019.9035107"},{"key":"19_CR84","doi-asserted-by":"crossref","unstructured":"Zhu, J.Y., Park, T., Isola, P., Efros, A.A.: Unpaired image-to-image translation using cycle-consistent adversarial networks. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2223\u20132232 (2017)","DOI":"10.1109\/ICCV.2017.244"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024 Workshops"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-92648-8_19","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,30]],"date-time":"2025-05-30T16:29:25Z","timestamp":1748622565000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-92648-8_19"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9783031926471","9783031926488"],"references-count":84,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-92648-8_19","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"12 May 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}