{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,31]],"date-time":"2026-03-31T13:53:04Z","timestamp":1774965184043,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":53,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,10,27]]},"DOI":"10.1145\/3746027.3755467","type":"proceedings-article","created":{"date-parts":[[2025,10,25]],"date-time":"2025-10-25T05:47:42Z","timestamp":1761371262000},"page":"8379-8388","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["FSCDiff: Frequency-Spatial Entangled Conditional Diffusion model for Underwater Salient Object Detection"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-0740-0691","authenticated-orcid":false,"given":"Hua","family":"Li","sequence":"first","affiliation":[{"name":"Hainan University, Haikou, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-1511-0646","authenticated-orcid":false,"given":"Gaowei","family":"Lin","sequence":"additional","affiliation":[{"name":"Hainan University, Haikou, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-2804-376X","authenticated-orcid":false,"given":"Zhiyuan","family":"Li","sequence":"additional","affiliation":[{"name":"Hainan University, Haikou, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7484-7261","authenticated-orcid":false,"given":"Sam","family":"Kwong","sequence":"additional","affiliation":[{"name":"Lingnan University, Hong Kong, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0972-4008","authenticated-orcid":false,"given":"Runmin","family":"Cong","sequence":"additional","affiliation":[{"name":"Shandong University, Jinan, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2025,10,27]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-023-01762-5"},{"key":"e_1_3_2_1_2_1","first-page":"6007","article-title":"Imagic: Text-based real image editing with diffusion models","author":"Kawar Bahjat","year":"2023","unstructured":"Bahjat Kawar, Shiran Zada, Oran Lang, Omer Tov, Huiwen Chang, Tali Dekel, Inbar Mosseri, and Michal Irani. 2023. Imagic: Text-based real image editing with diffusion models. In CVPR. 6007-6017.","journal-title":"CVPR."},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.compag.2019.105087"},{"key":"e_1_3_2_1_4_1","first-page":"1305","article-title":"WaterMask: Instance Segmentation for Underwater Imagery","author":"Lian Shijie","year":"2023","unstructured":"Shijie Lian, Hua Li, Runmin Cong, Suqi Li, Wei Zhang, and Sam Kwong. 2023. WaterMask: Instance Segmentation for Underwater Imagery. In ICCV. 1305-1315.","journal-title":"ICCV."},{"key":"e_1_3_2_1_5_1","first-page":"1","article-title":"Underwater virtual reality system for neutral buoyancy training: Development and evaluation","author":"Sinnott Christian","year":"2019","unstructured":"Christian Sinnott, James Liu, Courtney Matera, Savannah Halow, Ann Jones, Matthew Moroz, Jeffrey Mulligan, Michael Crognale, Eelke Folmer, and Paul MacNeilage. 2019. Underwater virtual reality system for neutral buoyancy training: Development and evaluation. In ACM MM. 1-9.","journal-title":"ACM MM."},{"key":"e_1_3_2_1_6_1","first-page":"4376","article-title":"An underwater image enhancement benchmark dataset and beyond","volume":"29","author":"Li Chongyi","year":"2019","unstructured":"Chongyi Li, Chunle Guo, Wenqi Ren, Runmin Cong, Junhui Hou, Sam Kwong, and Dacheng Tao. 2019. An underwater image enhancement benchmark dataset and beyond. IEEE TIP, Vol. 29 (2019), 4376-4389.","journal-title":"IEEE TIP"},{"key":"e_1_3_2_1_7_1","first-page":"3696","article-title":"Saliency prototype for RGB-D and RGB-T salient object detection","author":"Zhang Zihao","year":"2023","unstructured":"Zihao Zhang, Jie Wang, and Yahong Han. 2023. Saliency prototype for RGB-D and RGB-T salient object detection. In ACM MM. 3696-3705.","journal-title":"ACM MM."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2025.129718"},{"key":"e_1_3_2_1_9_1","first-page":"2578","article-title":"Fantastic animals and where to find them: Segment any marine animal with dual sam","author":"Zhang Pingping","year":"2024","unstructured":"Pingping Zhang, Tianyu Yan, Yang Liu, and Huchuan Lu. 2024. Fantastic animals and where to find them: Segment any marine animal with dual sam. In CVPR. 2578-2587.","journal-title":"CVPR."},{"key":"e_1_3_2_1_10_1","first-page":"1602","article-title":"Usod10k: a new benchmark dataset for underwater salient object detection","volume":"34","author":"Hong Lin","year":"2025","unstructured":"Lin Hong, Xin Wang, Gan Zhang, and Ming Zhao. 2025. Usod10k: a new benchmark dataset for underwater salient object detection. IEEE TIP 34 (2025), 1602-1615.","journal-title":"IEEE TIP"},{"key":"e_1_3_2_1_11_1","volume-title":"Embedding fourier for ultra-high-definition low-light image enhancement. ICLR","author":"Li C","year":"2023","unstructured":"C Li, CL Guo, M Zhou, Z Liang, S Zhou, R Feng, and CC Loy. 2023. Embedding fourier for ultra-high-definition low-light image enhancement. ICLR (2023)."},{"key":"e_1_3_2_1_12_1","first-page":"6014","article-title":"Fourier Prior-Based Two-Stage Architecture for Image Restoration","author":"Nehete Hemkant","year":"2024","unstructured":"Hemkant Nehete, Amit Monga, Partha Kaushik, and Brajesh Kumar Kaushik. 2024. Fourier Prior-Based Two-Stage Architecture for Image Restoration. In CVPR. 6014-6023.","journal-title":"CVPR."},{"key":"e_1_3_2_1_13_1","first-page":"5886","article-title":"Efficient frequency domain-based transformers for high-quality image deblurring","author":"Kong Lingshun","year":"2023","unstructured":"Lingshun Kong, Jiangxin Dong, Jianjun Ge, Mingqiang Li, and Jinshan Pan. 2023. Efficient frequency domain-based transformers for high-quality image deblurring. In CVPR. 5886-5895.","journal-title":"CVPR."},{"key":"e_1_3_2_1_14_1","first-page":"1","article-title":"Lightweight Multi-Frequency Enhancement Network for RGB-D Video Salient Object Detection","author":"Suolang Daerji","year":"2025","unstructured":"Daerji Suolang, Jiahao He, Wangchuk Tsering, Keren Fu, Xiaofeng Li, and Qijun Zhao. 2025. Lightweight Multi-Frequency Enhancement Network for RGB-D Video Salient Object Detection. In ICASSP. 1-5.","journal-title":"ICASSP."},{"key":"e_1_3_2_1_15_1","first-page":"37","article-title":"Diffit: Diffusion vision transformers for image generation","author":"Hatamizadeh Ali","year":"2024","unstructured":"Ali Hatamizadeh, Jiaming Song, Guilin Liu, Jan Kautz, and Arash Vahdat. 2024. Diffit: Diffusion vision transformers for image generation. In ECCV. 37-55.","journal-title":"ECCV."},{"key":"e_1_3_2_1_16_1","first-page":"10157","article-title":"Shifted diffusion for text-to-image generation","author":"Zhou Yufan","year":"2023","unstructured":"Yufan Zhou, Bingchen Liu, Yizhe Zhu, Xiao Yang, Changyou Chen, and Jinhui Xu. 2023. Shifted diffusion for text-to-image generation. In CVPR. 10157-10166.","journal-title":"CVPR."},{"key":"e_1_3_2_1_17_1","first-page":"14235","article-title":"Conditional text image generation with diffusion models","author":"Zhu Yuanzhi","year":"2023","unstructured":"Yuanzhi Zhu, Zhaohai Li, Tianwei Wang, Mengchao He, and Cong Yao. 2023. Conditional text image generation with diffusion models. In CVPR. 14235-14245.","journal-title":"CVPR."},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2023.3261988"},{"key":"e_1_3_2_1_19_1","volume-title":"Moein Heidari, Reza Azad, Mohsen Fayyaz, Ilker Hacihaliloglu, and Dorit Merhof.","author":"Kazerouni Amirhossein","year":"2023","unstructured":"Amirhossein Kazerouni, Ehsan Khodapanah Aghdam, Moein Heidari, Reza Azad, Mohsen Fayyaz, Ilker Hacihaliloglu, and Dorit Merhof. 2023. Diffusion models in medical imaging: A comprehensive survey. Medical image analysis, Vol. 88 (2023), 102846."},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2024.3361474"},{"key":"e_1_3_2_1_21_1","volume-title":"SVAM: Saliency-guided visual attention modeling by autonomous underwater robots.","author":"Islam Md Jahidul","year":"2022","unstructured":"Md Jahidul Islam, Ruobing Wang, and Junaed Sattar. 2022. SVAM: Saliency-guided visual attention modeling by autonomous underwater robots. (2022)."},{"key":"e_1_3_2_1_22_1","first-page":"6800","article-title":"CIR-Net: Cross-modality interaction and refinement for RGB-D salient object detection","volume":"31","author":"Cong Runmin","year":"2022","unstructured":"Runmin Cong, Qinwei Lin, Chen Zhang, Chongyi Li, Xiaochun Cao, Qingming Huang, and Yao Zhao. 2022. CIR-Net: Cross-modality interaction and refinement for RGB-D salient object detection. IEEE TIP 31 (2022), 6800-6815.","journal-title":"IEEE TIP"},{"key":"e_1_3_2_1_23_1","first-page":"2332","article-title":"Boosting salient object detection with transformer-based asymmetric bilateral U-Net","volume":"34","author":"Qiu Yu","year":"2023","unstructured":"Yu Qiu, Yun Liu, Le Zhang, Haotian Lu, and Jing Xu. 2023. Boosting salient object detection with transformer-based asymmetric bilateral U-Net. IEEE TCSVT 34, 4 (2023), 2332-2345.","journal-title":"IEEE TCSVT"},{"key":"e_1_3_2_1_24_1","first-page":"2160","article-title":"Hidanet: Rgb-d salient object detection via hierarchical depth awareness","volume":"32","author":"Allibert Guillaume","year":"2023","unstructured":"ongwei Wu, Guillaume Allibert, Fabrice Meriaudeau, Chao Ma, and C\u00e9dric Demonceaux. 2023. Hidanet: Rgb-d salient object detection via hierarchical depth awareness. IEEE TIP 32 (2023), 2160-2173.","journal-title":"IEEE TIP"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2024.3388153"},{"key":"e_1_3_2_1_26_1","first-page":"9048","article-title":"CoDi: conditional diffusion distillation for higher-fidelity and faster image generation","author":"Mei Kangfu","year":"2024","unstructured":"Kangfu Mei, Mauricio Delbracio, Hossein Talebi, Zhengzhong Tu, Vishal M Patel, and Peyman Milanfar. 2024. CoDi: conditional diffusion distillation for higher-fidelity and faster image generation. In CVPR. 9048-9058.","journal-title":"CVPR."},{"key":"e_1_3_2_1_27_1","first-page":"3836","article-title":"Adding conditional control to text-to-image diffusion models","author":"Zhang Lvmin","year":"2023","unstructured":"Lvmin Zhang, Anyi Rao, and Maneesh Agrawala. 2023. Adding conditional control to text-to-image diffusion models. In ICCV. 3836-3847.","journal-title":"ICCV."},{"key":"e_1_3_2_1_28_1","unstructured":"Junde Wu Wei Ji Huazhu Fu Min Xu Yueming Jin and Yanwu Xu. 2024. Medsegdiff-v2: Diffusion-based medical image segmentation with transformer. In AAAI."},{"key":"e_1_3_2_1_29_1","first-page":"1623","article-title":"Medsegdiff: Medical image segmentation with diffusion probabilistic model","author":"Wu Junde","year":"2024","unstructured":"Junde Wu, Rao Fu, Huihui Fang, Yu Zhang, Yehui Yang, Haoyi Xiong, Huiying Liu, and Yanwu Xu. 2024. Medsegdiff: Medical image segmentation with diffusion probabilistic model. In Medical Imaging with Deep Learning. 1623-1639.","journal-title":"Medical Imaging with Deep Learning."},{"key":"e_1_3_2_1_30_1","first-page":"7345","article-title":"Conditional diffusion for interactive segmentation","author":"Chen Xi","year":"2021","unstructured":"Xi Chen, Zhiyan Zhao, Feiwu Yu, Yilei Zhang, and Manni Duan. 2021. Conditional diffusion for interactive segmentation. In ICCV. 7345-7354.","journal-title":"ICCV."},{"key":"e_1_3_2_1_31_1","first-page":"22445","article-title":"Dire for diffusion-generated image detection","author":"Wang Zhendong","year":"2023","unstructured":"Zhendong Wang, Jianmin Bao, Wengang Zhou, Weilun Wang, Hezhen Hu, Hong Chen, and Houqiang Li. 2023. Dire for diffusion-generated image detection. In ICCV. 22445-22455.","journal-title":"ICCV."},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i2.27890"},{"key":"e_1_3_2_1_33_1","volume-title":"So Kweon, and Yanning Zhang. 2024","author":"Niu Axi","year":"2024","unstructured":"Axi Niu, Trung X Pham, Kang Zhang, Jinqiu Sun, Yu Zhu, Qingsen Yan, In So Kweon, and Yanning Zhang. 2024. ACDMSR: Accelerated conditional diffusion models for single image super-resolution. IEEE Transactions on Broadcasting (2024)."},{"key":"e_1_3_2_1_34_1","first-page":"10021","article-title":"Implicit diffusion models for continuous super-resolution","author":"Gao Sicheng","year":"2023","unstructured":"Sicheng Gao, Xuhui Liu, Bohan Zeng, Sheng Xu, Yanjing Li, Xiaoyan Luo, Jianzhuang Liu, Xiantong Zhen, and Baochang Zhang. 2023. Implicit diffusion models for continuous super-resolution. In CVPR. 10021-10030.","journal-title":"CVPR."},{"key":"e_1_3_2_1_35_1","volume-title":"Diffusion models, image super-resolution, and everything: A survey","author":"Moser Brian B","year":"2024","unstructured":"Brian B Moser, Arundhati S Shanbhag, Federico Raue, Stanislav Frolov, Sebastian Palacio, and Andreas Dengel. 2024. Diffusion models, image super-resolution, and everything: A survey. IEEE Transactions on Neural Networks and Learning Systems (2024), 1-21."},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1007\/s41095-022-0274-8"},{"key":"e_1_3_2_1_37_1","first-page":"110328","article-title":"Separate first, then segment: An integrity segmentation network for salient object detection","volume":"150","author":"Zhu Ge","year":"2024","unstructured":"Ge Zhu, Jinbao Li, and Yahong Guo. 2024. Separate first, then segment: An integrity segmentation network for salient object detection. PR 150 (2024), 110328.","journal-title":"PR"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2024.3469286"},{"key":"e_1_3_2_1_39_1","volume-title":"Attention is all you need. NIPS 30","author":"Vaswani Ashish","year":"2017","unstructured":"Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan N Gomez, Lukasz Kaiser, and Illia Polosukhin. 2017. Attention is all you need. NIPS 30 (2017)."},{"key":"e_1_3_2_1_40_1","first-page":"6840","article-title":"Denoising diffusion probabilistic models","volume":"33","author":"Ho Jonathan","year":"2020","unstructured":"Jonathan Ho, Ajay Jain, and Pieter Abbeel. 2020. Denoising diffusion probabilistic models. NIPS 33 (2020), 6840-6851.","journal-title":"NIPS"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-50835-1_22"},{"key":"e_1_3_2_1_42_1","first-page":"9026","volume-title":"IEEE TPAMI","volume":"44","author":"Liu Nian","year":"2021","unstructured":"Nian Liu, Ni Zhang, Ling Shao, and Junwei Han. 2021. Learning selective mutual attention and contrast for RGB-D saliency detection. IEEE TPAMI, Vol. 44, 12 (2021), 9026-9042."},{"key":"e_1_3_2_1_43_1","first-page":"13756","article-title":"Learning selective self-mutual attention for RGB-D saliency detection","author":"Liu Nian","year":"2020","unstructured":"Nian Liu, Ni Zhang, and Junwei Han. 2020. Learning selective self-mutual attention for RGB-D saliency detection. In CVPR. 13756-13765.","journal-title":"CVPR."},{"key":"e_1_3_2_1_44_1","first-page":"8727","article-title":"Bifurcated Backbone Strategy for RGB-D Salient Object Detection","volume":"30","author":"Zhai Yingjie","year":"2021","unstructured":"Yingjie Zhai, Deng-Ping Fan, Jufeng Yang, Ali Borji, Ling Shao, Junwei Han, and Liang Wang. 2021. Bifurcated Backbone Strategy for RGB-D Salient Object Detection. IEEE TIP, Vol. 30 (2021), 8727-8742.","journal-title":"IEEE TIP"},{"key":"e_1_3_2_1_45_1","first-page":"2094","article-title":"Cross-modality discrepant interaction network for RGB-D salient object detection","author":"Zhang Chen","year":"2021","unstructured":"Chen Zhang, Runmin Cong, Qinwei Lin, Lin Ma, Feng Li, Yao Zhao, and Sam Kwong. 2021. Cross-modality discrepant interaction network for RGB-D salient object detection. In ACM MM. 2094-2102.","journal-title":"ACM MM."},{"key":"e_1_3_2_1_46_1","first-page":"406","article-title":"Point-aware interaction and cnn-induced refinement network for RGB-D salient object detection","author":"Cong Runmin","year":"2023","unstructured":"Runmin Cong, Hongyu Liu, Chen Zhang, Wei Zhang, Feng Zheng, Ran Song, and Sam Kwong. 2023. Point-aware interaction and cnn-induced refinement network for RGB-D salient object detection. In ACM MM. 406-416.","journal-title":"ACM MM."},{"key":"e_1_3_2_1_47_1","first-page":"2249","volume-title":"IEEE TMM","volume":"26","author":"Sun Fuming","year":"2023","unstructured":"Fuming Sun, Peng Ren, Bowen Yin, Fasheng Wang, and Haojie Li. 2023. CATNet: A cascaded and aggregated transformer network for RGB-D salient object detection. IEEE TMM, Vol. 26 (2023), 2249-2262."},{"key":"e_1_3_2_1_48_1","first-page":"5257","article-title":"Salient object detection in optical remote sensing images driven by transformer","volume":"32","author":"Li Gongyang","year":"2023","unstructured":"Gongyang Li, Zhen Bai, Zhi Liu, Xinpeng Zhang, and Haibin Ling. 2023. Salient object detection in optical remote sensing images driven by transformer. IEEE TIP, Vol. 32 (2023), 5257-5269.","journal-title":"IEEE TIP"},{"key":"e_1_3_2_1_49_1","first-page":"3212","article-title":"Quality-aware selective fusion network for VDT salient object detection","volume":"33","author":"Bao Liuxin","year":"2024","unstructured":"Liuxin Bao, Xiaofei Zhou, Xiankai Lu, Yaoqi Sun, Haibing Yin, Zhenghui Hu, Jiyong Zhang, and Chenggang Yan. 2024. Quality-aware selective fusion network for VDT salient object detection. IEEE TIP 33 (2024), 3212-3226.","journal-title":"IEEE TIP"},{"key":"e_1_3_2_1_50_1","first-page":"10692","article-title":"Alignment-free rgbt salient object detection: Semantics-guided asymmetric correlation network and a unified benchmark","volume":"26","author":"Wang Kunpeng","year":"2024","unstructured":"Kunpeng Wang, Danying Lin, Chenglong Li, Zhengzheng Tu, and Bin Luo. 2024. Alignment-free rgbt salient object detection: Semantics-guided asymmetric correlation network and a unified benchmark. IEEE TMM 26 (2024), 10692-10707.","journal-title":"IEEE TMM"},{"key":"e_1_3_2_1_51_1","first-page":"28170","article-title":"CoralSCOP: segment any coral image on this planet","author":"Zheng Ziqiang","year":"2024","unstructured":"Ziqiang Zheng, Haixin Liang, Binh-Son Hua, Yue Him Wong, Put Ang, Apple Pui Yi Chui, and Sai-Kit Yeung. 2024. CoralSCOP: segment any coral image on this planet. In CVPR. 28170-28180.","journal-title":"CVPR."},{"key":"e_1_3_2_1_52_1","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2024.3491907"},{"key":"e_1_3_2_1_53_1","first-page":"608","article-title":"A simple yet effective network based on vision transformer for camouflaged object and salient object detection","volume":"34","author":"Hao Chao","year":"2025","unstructured":"Chao Hao, Zitong Yu, Xin Liu, Jun Xu, Huanjing Yue, and Jingyu Yang. 2025. A simple yet effective network based on vision transformer for camouflaged object and salient object detection. IEEE TIP, Vol. 34 (2025), 608-622.","journal-title":"IEEE TIP"}],"event":{"name":"MM '25: The 33rd ACM International Conference on Multimedia","location":"Dublin Ireland","acronym":"MM '25","sponsor":["SIGMM ACM Special Interest Group on Multimedia"]},"container-title":["Proceedings of the 33rd ACM International Conference on Multimedia"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3746027.3755467","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,9]],"date-time":"2025-12-09T19:22:20Z","timestamp":1765308140000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3746027.3755467"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,27]]},"references-count":53,"alternative-id":["10.1145\/3746027.3755467","10.1145\/3746027"],"URL":"https:\/\/doi.org\/10.1145\/3746027.3755467","relation":{},"subject":[],"published":{"date-parts":[[2025,10,27]]},"assertion":[{"value":"2025-10-27","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}