{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,11]],"date-time":"2026-03-11T16:56:37Z","timestamp":1773248197509,"version":"3.50.1"},"reference-count":70,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"Major Science and Technology Innovation 2030"},{"name":"New Generation Artificial Intelligence\u201d Key Project","award":["2021ZD0111700"],"award-info":[{"award-number":["2021ZD0111700"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62336003"],"award-info":[{"award-number":["62336003"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["12371510"],"award-info":[{"award-number":["12371510"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62172354"],"award-info":[{"award-number":["62172354"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of 
China","doi-asserted-by":"publisher","award":["62076005"],"award-info":[{"award-number":["62076005"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"NSF of Jiangsu Province","award":["BZ2021013"],"award-info":[{"award-number":["BZ2021013"]}]},{"name":"NSF for Distinguished Young Scholar of Jiangsu Province","award":["BK20220080"],"award-info":[{"award-number":["BK20220080"]}]},{"name":"Dreams Foundation of Jianghuai Advance Technology Center","award":["2023-ZM01Z015"],"award-info":[{"award-number":["2023-ZM01Z015"]}]},{"name":"Yunling Scholar Talent Program of Yunnan Province","award":["K264202230207"],"award-info":[{"award-number":["K264202230207"]}]},{"name":"Yunnan Dengcheng Expert Workstation","award":["202305AF150202"],"award-info":[{"award-number":["202305AF150202"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Multimedia"],"published-print":{"date-parts":[[2025]]},"DOI":"10.1109\/tmm.2025.3535387","type":"journal-article","created":{"date-parts":[[2025,1,28]],"date-time":"2025-01-28T18:44:24Z","timestamp":1738089864000},"page":"3251-3265","source":"Crossref","is-referenced-by-count":6,"title":["SpliceMix: A Cross-Scale and Semantic Blending Augmentation Strategy for Multi-Label Image Classification"],"prefix":"10.1109","volume":"27","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-3860-5139","authenticated-orcid":false,"given":"Lei","family":"Wang","sequence":"first","affiliation":[{"name":"Key Laboratory of Intelligent Perception and Systems for High-Dimensional Information of Ministry of Education, Jiangsu Key Laboratory of Image and Video Understanding for Social Security, School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, Jiangsu, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3180-0484","authenticated-orcid":false,"given":"Yibing","family":"Zhan","sequence":"additional","affiliation":[{"name":"JD 
Explore Academy, Beijing, China"}]},{"given":"Leilei","family":"Ma","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, Anhui University, Hefei, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0783-5273","authenticated-orcid":false,"given":"Dapeng","family":"Tao","sequence":"additional","affiliation":[{"name":"FIST LAB, School of Information Science and Engineering, Yunnan University, Kunming, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8976-2084","authenticated-orcid":false,"given":"Liang","family":"Ding","sequence":"additional","affiliation":[{"name":"JD Explore Academy, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4092-9856","authenticated-orcid":false,"given":"Chen","family":"Gong","sequence":"additional","affiliation":[{"name":"Key Laboratory of Intelligent Perception and Systems for High-Dimensional Information of Ministry of Education, Jiangsu Key Laboratory of Image and Video Understanding for Social Security, School of Computer Science and Engineering, Nanjing University of Science and Technology, Nanjing, Jiangsu, China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref2","first-page":"7588","article-title":"Neural architecture search without training","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Mellor","year":"2021"},{"key":"ref3","first-page":"2866","article-title":"Mixup: Beyond empirical risk minimization","volume-title":"Proc. Int. Conf. Learn. 
Representations","author":"Zhang","year":"2018"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2023.3326300"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01553"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2023.3237166"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00025"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01242"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6964"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00612"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00815"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58589-1_39"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00532"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01621"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2022.3171095"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2023.3277279"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01108"},{"key":"ref18","first-page":"5275","article-title":"Puzzle mix: Exploiting saliency and local statistics for optimal mixup","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Kim","year":"2020"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19809-0_26"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/WACV48630.2021.00141"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00692"},{"key":"ref22","first-page":"1","article-title":"Saliencymix: A saliency guided data augmentation strategy for better regularization","volume-title":"Proc. Int. Conf. Learn. 
Representations","author":"Uddin","year":"2021"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.219"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v32i1.12281"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2021.3088605"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1145\/3503161.3547834"},{"key":"ref27","article-title":"Recurrent neural network regularization","author":"Zaremba","year":"2014"},{"key":"ref28","first-page":"2713","article-title":"Semi-supervised classification with graph convolutional networks","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Kipf","year":"2017"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.251"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00861"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00061"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00023"},{"key":"ref34","article-title":"Query2label: A simple transformer way to multi-label classification","author":"Liu","year":"2021"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1145\/3503161.3548343"},{"key":"ref36","first-page":"1","article-title":"Causality compensated attention for contextual biased visual recognition","volume-title":"Proc. Int. Conf. Learn. 
Representations","author":"Liu","year":"2023"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00840"},{"key":"ref38","article-title":"Improved regularization of convolutional neural networks with cutout","author":"DeVries","year":"2017"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW50498.2020.00386"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9053994"},{"key":"ref41","article-title":"Drawing multiple augmentation samples per image during training efficiently decreases test error","author":"Fort","year":"2021"},{"key":"ref42","first-page":"8026","article-title":"Pytorch: An imperative style, high-performance deep learning library","volume-title":"Proc. 33rd Int. Conf. Neural Inf. Process. Syst.","author":"Paszke","year":"2019"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00454"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01165"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i8.16865"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-021-01453-z"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00015"},{"key":"ref48","article-title":"Distilling the knowledge in a neural network","author":"Hinton","year":"2015"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01167"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1804.02767"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-009-0275-4"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i4.16472"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2022.3148867"},{"key":"ref55","article-title":"Resizemix: Mixing data with preserved object information and true 
labels","author":"Qin","year":"2020"},{"key":"ref56","first-page":"8427","article-title":"Recursivemix: Mixed learning with history","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Yang","year":"2022"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i1.19910"},{"key":"ref59","article-title":"Simple and robust loss design for multi-label learning with missing labels","author":"Zhang","year":"2021"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00099"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.324"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01264-9_8"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2010.11929"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00088"},{"key":"ref66","article-title":"ImageNet-21k pretraining for the masses","author":"Ridnik","year":"2021"},{"key":"ref67","article-title":"Fixing the train-test resolution discrepancy","volume-title":"Proc. Adv. Neural Inf. Process. 
Syst.","author":"Touvron","year":"2019"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00132"},{"key":"ref69","article-title":"[Re] don\u2019t judge an object by its context: Learning to overcome contextual bias","author":"Kim","year":"2021"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.319"}],"container-title":["IEEE Transactions on Multimedia"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/6046\/10844992\/10856374.pdf?arnumber=10856374","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,12]],"date-time":"2025-06-12T17:43:42Z","timestamp":1749750222000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10856374\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"references-count":70,"URL":"https:\/\/doi.org\/10.1109\/tmm.2025.3535387","relation":{},"ISSN":["1520-9210","1941-0077"],"issn-type":[{"value":"1520-9210","type":"print"},{"value":"1941-0077","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]}}}