{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T17:12:46Z","timestamp":1777655566673,"version":"3.51.4"},"publisher-location":"New York, NY, USA","reference-count":68,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,10,28]],"date-time":"2024-10-28T00:00:00Z","timestamp":1730073600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,10,28]]},"DOI":"10.1145\/3664647.3680888","type":"proceedings-article","created":{"date-parts":[[2024,10,26]],"date-time":"2024-10-26T06:59:33Z","timestamp":1729925973000},"page":"10382-10391","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":36,"title":["LoFormer: Local Frequency Transformer for Image Deblurring"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0002-3129-2723","authenticated-orcid":false,"given":"Xintian","family":"Mao","sequence":"first","affiliation":[{"name":"Shanghai Key Laboratory of Multidimensional Information Processing, East China Normal University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5724-5357","authenticated-orcid":false,"given":"Jiansheng","family":"Wang","sequence":"additional","affiliation":[{"name":"Shanghai Key Laboratory of Multidimensional Information Processing, East China Normal University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-1449-1852","authenticated-orcid":false,"given":"Xingran","family":"Xie","sequence":"additional","affiliation":[{"name":"Shanghai Key Laboratory of Multidimensional Information Processing, East China Normal University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5063-8801","authenticated-orcid":false,"given":"Qingli","family":"Li","sequence":"additional","affiliation":[{"name":"Shanghai Key Laboratory of Multidimensional Information Processing, East China Normal University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1592-9627","authenticated-orcid":false,"given":"Yan","family":"Wang","sequence":"additional","affiliation":[{"name":"Shanghai Key Laboratory of Multidimensional Information Processing, East China Normal University, Shanghai, China"}]}],"member":"320","published-online":{"date-parts":[[2024,10,28]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Jamie Ryan Kiros, and Geoffrey E. Hinton","author":"Ba Lei Jimmy","year":"2016","unstructured":"Lei Jimmy Ba, Jamie Ryan Kiros, and Geoffrey E. Hinton. 2016. Layer Normalization. CoRR, Vol. abs\/1607.06450 (2016)."},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01212"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20071-7_2"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW53098.2021.00027"},{"key":"e_1_3_2_1_6_1","unstructured":"Mark Chen Alec Radford Rewon Child Jeffrey Wu Heewoo Jun David Luan and Ilya Sutskever. 2020. Generative Pretraining From Pixels. In Proc? ICML. 1691--1703."},{"key":"e_1_3_2_1_7_1","volume-title":"Proc. NeurIPS, Hugo Larochelle, Marc'Aurelio Ranzato, Raia Hadsell, Maria-Florina Balcan, and Hsuan-Tien Lin (Eds.).","author":"Chi Lu","year":"2020","unstructured":"Lu Chi, Borui Jiang, and Yadong Mu. 2020. Fast Fourier Convolution. In Proc. NeurIPS, Hugo Larochelle, Marc'Aurelio Ranzato, Raia Hadsell, Maria-Florina Balcan, and Hsuan-Tien Lin (Eds.)."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00460"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20071-7_4"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01195"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01134"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/3581783.3611976"},{"key":"e_1_3_2_1_14_1","volume-title":"Proc. ICLR.","author":"Dosovitskiy Alexey","year":"2020","unstructured":"Alexey Dosovitskiy, Lucas Beyer, Alexander Kolesnikov, Dirk Weissenborn, Xiaohua Zhai, Thomas Unterthiner, Mostafa Dehghani, Matthias Minderer, Georg Heigold, Sylvain Gelly, et al. 2020. An Image is Worth 16x16 Words: Transformers for Image Recognition at Scale. In Proc. ICLR."},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01736"},{"key":"e_1_3_2_1_16_1","volume-title":"Learning Enriched Features via Selective State Spaces Model for Efficient Image Deblurring. arXiv preprint arXiv:2403.20106","author":"Gao Hu","year":"2024","unstructured":"Hu Gao and Depeng Dang. 2024. Learning Enriched Features via Selective State Spaces Model for Efficient Image Deblurring. arXiv preprint arXiv:2403.20106 (2024)."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46448-0_38"},{"key":"e_1_3_2_1_18_1","volume-title":"Spatially-Variant Degradation Model for Dataset-free Super-resolution. arXiv preprint arXiv:2407.08252","author":"Guo Shaojie","year":"2024","unstructured":"Shaojie Guo, Haofei Song, Qingli Li, and Yan Wang. 2024. Spatially-Variant Degradation Model for Dataset-free Super-resolution. arXiv preprint arXiv:2407.08252 (2024)."},{"key":"e_1_3_2_1_19_1","volume-title":"Learning shared semantic space for speech-to-text translation. arXiv preprint arXiv:2105.03095","author":"Han Chi","year":"2021","unstructured":"Chi Han, Mingxuan Wang, Heng Ji, and Lei Li. 2021. Learning shared semantic space for speech-to-text translation. arXiv preprint arXiv:2105.03095 (2021)."},{"key":"e_1_3_2_1_20_1","unstructured":"Ronghang Hu Amanpreet Singh Trevor Darrell and Marcus Rohrbach. 2020. Iterative Answer Prediction With Pointer-Augmented Multimodal Transformers for TextVQA. In Proc?CVPR."},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02445"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02358"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00570"},{"key":"e_1_3_2_1_24_1","volume-title":"Efficient Visual State Space Model for Image Deblurring. arXiv preprint arXiv:2405.14343","author":"Kong Lingshun","year":"2024","unstructured":"Lingshun Kong, Jiangxin Dong, Ming-Hsuan Yang, and Jinshan Pan. 2024. Efficient Visual State Space Model for Image Deblurring. arXiv preprint arXiv:2405.14343 (2024)."},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00854"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00897"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01150"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW54120.2021.00210"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02418"},{"key":"e_1_3_2_1_30_1","volume-title":"Swin Transformer: Hierarchical Vision Transformer using Shifted Windows. In Proc?ICCV.","author":"Liu Ze","year":"2021","unstructured":"Ze Liu, Yutong Lin, Yue Cao, Han Hu, Yixuan Wei, Zheng Zhang, Stephen Lin, and Baining Guo. 2021. Swin Transformer: Hierarchical Vision Transformer using Shifted Windows. In Proc?ICCV."},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"e_1_3_2_1_32_1","volume-title":"Proc. ICLR.","author":"Loshchilov Ilya","year":"2017","unstructured":"Ilya Loshchilov and Frank Hutter. 2017. SGDR: Stochastic Gradient Descent with Warm Restarts. In Proc. ICLR."},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02398"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02426"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i2.25281"},{"key":"e_1_3_2_1_36_1","volume-title":"Reduction of JPEG compression artifacts based on DCT coefficients prediction. Neurocomputing","author":"Mengdi Sun","year":"2020","unstructured":"Sun Mengdi, Xiaohai He, Xiong Shuhua, Chao Ren, and Li Xinglong. 2020. Reduction of JPEG compression artifacts based on DCT coefficients prediction. Neurocomputing (2020)."},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.35"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW53098.2021.00025"},{"key":"e_1_3_2_1_39_1","volume-title":"Proc. ICCV.","author":"Qin Zequn","year":"2020","unstructured":"Zequn Qin, Pengyi Zhang, Fei Wu, and Xi Li. 2020. FcaNet: Frequency Channel Attention Networks. In Proc. ICCV."},{"key":"e_1_3_2_1_40_1","volume-title":"Proc. NeurIPS.","author":"Rao Yongming","year":"2021","unstructured":"Yongming Rao, Wenliang Zhao, Zheng Zhu, Jiwen Lu, and Jie Zhou. 2021. Global Filter Networks for Image Classification. In Proc. NeurIPS."},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58595-2_12"},{"key":"e_1_3_2_1_42_1","volume-title":"Adams","author":"Rippel Oren","year":"2015","unstructured":"Oren Rippel, Jasper Snoek, and Ryan P. Adams. 2015. Spectral Representations for Convolutional Neural Networks. In Proc. NeurIPS."},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.1109\/WACV48630.2021.00331"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2023.3333238"},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00567"},{"key":"e_1_3_2_1_47_1","volume-title":"I 3 Net: Inter-Intra-slice Interpolation Network for Medical Slice Synthesis","author":"Song Haofei","year":"2024","unstructured":"Haofei Song, Xintian Mao, Jing Yu, Qingli Li, and Yan Wang. 2024. I 3 Net: Inter-Intra-slice Interpolation Network for Medical Slice Synthesis. IEEE Transactions on Medical Imaging (2024)."},{"key":"e_1_3_2_1_48_1","volume-title":"Proc. ICLR.","author":"Su Weijie","year":"2020","unstructured":"Weijie Su, Xizhou Zhu, Yue Cao, Bin Li, Lewei Lu, Furu Wei, and Jifeng Dai. 2020. VL-BERT: Pre-training of Generic Visual-Linguistic Representations. In Proc. ICLR."},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00756"},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"publisher","DOI":"10.1109\/WACV51458.2022.00323"},{"key":"e_1_3_2_1_51_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00853"},{"key":"e_1_3_2_1_52_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19800-7_9"},{"key":"e_1_3_2_1_53_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00568"},{"key":"e_1_3_2_1_54_1","volume-title":"Proc. NeurIPS.","author":"Vaswani Ashish","year":"2017","unstructured":"Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan N Gomez, \u0141ukasz Kaiser, and Illia Polosukhin. 2017. Attention is all you need. In Proc. NeurIPS."},{"key":"e_1_3_2_1_55_1","doi-asserted-by":"publisher","DOI":"10.2737\/FPL-GTR-290"},{"key":"e_1_3_2_1_56_1","doi-asserted-by":"publisher","DOI":"10.2737\/FPL-GTR-290"},{"key":"e_1_3_2_1_57_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00427"},{"key":"e_1_3_2_1_58_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00414"},{"key":"e_1_3_2_1_59_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19806-9_19"},{"key":"e_1_3_2_1_60_1","volume-title":"Proc. NeurIPS.","author":"Yu Hu","year":"2022","unstructured":"Hu Yu, Jie Huang, Feng Zhao, Jinwei Gu, Chen Change Loy, Deyu Meng, Chongyi Li, et al. 2022. Deep Fourier Up-Sampling. In Proc. NeurIPS."},{"key":"e_1_3_2_1_61_1","doi-asserted-by":"publisher","DOI":"10.1145\/3581783.3612335"},{"key":"e_1_3_2_1_62_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00564"},{"key":"e_1_3_2_1_63_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01458"},{"key":"e_1_3_2_1_64_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00613"},{"key":"e_1_3_2_1_65_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00281"},{"key":"e_1_3_2_1_66_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2021.3115139"},{"key":"e_1_3_2_1_67_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00446"},{"key":"e_1_3_2_1_68_1","volume-title":"Proc. NeurIPS.","author":"Zhong Zhisheng","year":"2018","unstructured":"Zhisheng Zhong, Tiancheng Shen, Yibo Yang, Zhouchen Lin, and Chao Zhang. 2018. Joint Sub-bands Learning with Clique Structures for Wavelet Domain Super-Resolution. In Proc. NeurIPS."}],"event":{"name":"MM '24: The 32nd ACM International Conference on Multimedia","location":"Melbourne VIC Australia","acronym":"MM '24","sponsor":["SIGMM ACM Special Interest Group on Multimedia"]},"container-title":["Proceedings of the 32nd ACM International Conference on Multimedia"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3664647.3680888","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3664647.3680888","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T01:17:33Z","timestamp":1750295853000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3664647.3680888"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10,28]]},"references-count":68,"alternative-id":["10.1145\/3664647.3680888","10.1145\/3664647"],"URL":"https:\/\/doi.org\/10.1145\/3664647.3680888","relation":{},"subject":[],"published":{"date-parts":[[2024,10,28]]},"assertion":[{"value":"2024-10-28","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}