{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,28]],"date-time":"2026-02-28T18:35:28Z","timestamp":1772303728447,"version":"3.50.1"},"reference-count":82,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"12","license":[{"start":{"date-parts":[[2023,12,1]],"date-time":"2023-12-01T00:00:00Z","timestamp":1701388800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2023,12,1]],"date-time":"2023-12-01T00:00:00Z","timestamp":1701388800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,12,1]],"date-time":"2023-12-01T00:00:00Z","timestamp":1701388800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"National Key R &amp; D Program of China","award":["2022ZD0116500"],"award-info":[{"award-number":["2022ZD0116500"]}]},{"name":"Shanghai Committee of Science and Technology","award":["21DZ1100100"],"award-info":[{"award-number":["21DZ1100100"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61836014"],"award-info":[{"award-number":["61836014"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["U21B2042"],"award-info":[{"award-number":["U21B2042"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62006231"],"award-info":[{"award-number":["62006231"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62072457"],"award-info":[{"award-number":["62072457"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Pattern Anal. Mach. Intell."],"published-print":{"date-parts":[[2023,12]]},"DOI":"10.1109\/tpami.2023.3301302","type":"journal-article","created":{"date-parts":[[2023,8,2]],"date-time":"2023-08-02T17:43:47Z","timestamp":1690998227000},"page":"15996-16012","source":"Crossref","is-referenced-by-count":18,"title":["Weakly Supervised Semantic Segmentation via Box-Driven Masking and Filling Rate Shifting"],"prefix":"10.1109","volume":"45","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-1223-3242","authenticated-orcid":false,"given":"Chunfeng","family":"Song","sequence":"first","affiliation":[{"name":"Center for Research on Intelligent Perception and Computing (CRIPAC), National Laboratory of Pattern Recognition (NLPR), State Key Laboratory of Multimodal Artificial Intelligence Systems (MAIS), Institute of Automation, Chinese Academy of Sciences (CASIA), Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9163-2761","authenticated-orcid":false,"given":"Wanli","family":"Ouyang","sequence":"additional","affiliation":[{"name":"Shanghai Artificial Intelligence Laboratory, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2648-3875","authenticated-orcid":false,"given":"Zhaoxiang","family":"Zhang","sequence":"additional","affiliation":[{"name":"Center for Research on Intelligent Perception and Computing (CRIPAC), National Laboratory of Pattern Recognition (NLPR), State Key Laboratory of Multimodal Artificial Intelligence Systems (MAIS), Institute of Automation, Chinese Academy of Sciences (CASIA), University of Chinese Academy of Sciences (UCAS), Beijing, China"}]}],"member":"263","reference":[{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46466-4_32"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00307"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1145\/1015706.1015720"},{"key":"ref15","first-page":"675","article-title":"PAD-Net: Multi-tasks guided prediction-and-distillation network for simultaneous depth estimation and scene parsing","author":"dan","year":"2018","journal-title":"Proc IEEE Conf Comput Vis Pattern Recognit"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00129"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.191"},{"key":"ref58","article-title":"Very deep convolutional networks for large-scale image recognition","author":"simonyan","year":"2014"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1145\/3240508.3240542"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2537320"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00425"},{"key":"ref55","article-title":"Faster R-CNN: Towards real-time object detection with region proposal networks","author":"ren","year":"2015","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref10","first-page":"801","article-title":"Encoder-decoder with atrous separable convolution for semantic image segmentation","author":"chen","year":"2018","journal-title":"Proc Eur Conf Comput Vis"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2019.2901393"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-014-0733-5"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00254"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01240-3_23"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6705"},{"key":"ref51","first-page":"1990","article-title":"Learning to segment object candidates","author":"pinheiro","year":"2015","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref50","first-page":"82","article-title":"Recurrent convolutional neural networks for scene labeling","author":"pinheiro","year":"2014","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref46","first-page":"507","article-title":"On regularized losses for weakly-supervised CNN segmentation","author":"meng","year":"2018","journal-title":"Proc Eur Conf Comput Vis"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58558-7_46"},{"key":"ref48","first-page":"1742","article-title":"Weakly-and semi-supervised learning of a deep convolutional network for semantic image segmentation","author":"papandreou","year":"2015","journal-title":"Proc IEEE Int Conf Comput Vis"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00684"},{"key":"ref42","first-page":"740","article-title":"Microsoft COCO: Common objects in context","author":"lin","year":"2014","journal-title":"Proc Eur Conf Comput Vis"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.348"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.3023152"},{"key":"ref49","article-title":"Usage: A unified seed area generation paradigm for weakly supervised semantic segmentation","author":"peng","year":"2023"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2017.2699184"},{"key":"ref7","article-title":"Semantic image segmentation with deep convolutional nets and fully connected CRFs","author":"chen","year":"2015","journal-title":"Proc Int Conf Learn Representations"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.396"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00684"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46478-7_34"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.667"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00511"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00399"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.319"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.344"},{"key":"ref80","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.179"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00267"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00747"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00406"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00715"},{"key":"ref37","first-page":"102","article-title":"Weakly-and semi-supervised panoptic segmentation","author":"li","year":"2018","journal-title":"Proc Eur Conf Comput Vis"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00545"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58583-9_18"},{"key":"ref75","article-title":"Multi-scale context aggregation by dilated convolutions","author":"yu","year":"2018"},{"key":"ref30","first-page":"109","article-title":"Efficient inference in fully connected CRFs with Gaussian edge potentials","author":"kr\u00e4henb\u00fchl","year":"2011","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref74","first-page":"2048","article-title":"Show, attend and tell: Neural image caption generation with visual attention","author":"xu","year":"2015","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00541"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2021.3083269"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00126"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58539-6_11"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00523"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00231"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2820063"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19818-2_1"},{"key":"ref71","article-title":"Learning class-agnostic pseudo mask generation for box-supervised semantic segmentation","author":"xie","year":"2021"},{"key":"ref70","first-page":"418","article-title":"Unified perceptual parsing for scene understanding","author":"xiao","year":"2018","journal-title":"Proc Eur Conf Comput Vis"},{"key":"ref73","article-title":"Learning deep structured multi-scale features using attention-gated CRFs for contour prediction","author":"xu","year":"2017","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref72","first-page":"12077","article-title":"SegFormer: Simple and efficient design for semantic segmentation with transformers","author":"xie","year":"2021","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref24","article-title":"Self-erasing network for integral object attention","author":"hou","year":"2018","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00759"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00147"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00069"},{"key":"ref25","article-title":"Weakly supervised instance segmentation using the bounding box tightness prior","author":"hsu","year":"2019","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2019.01.006"},{"key":"ref20","article-title":"Attentional network for visual object detection","author":"hara","year":"2017"},{"key":"ref64","first-page":"577","article-title":"Constrained k-means clustering with background knowledge","author":"wagstaff","year":"2001","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.315"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.322"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-020-01293-3"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2011.6126343"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.2983686"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/2647868.2654889"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00733"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.181"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00325"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.3013717"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00540"}],"container-title":["IEEE Transactions on Pattern Analysis and Machine Intelligence"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/34\/10308548\/10202580.pdf?arnumber=10202580","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,11,27]],"date-time":"2023-11-27T19:54:44Z","timestamp":1701114884000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10202580\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,12]]},"references-count":82,"journal-issue":{"issue":"12"},"URL":"https:\/\/doi.org\/10.1109\/tpami.2023.3301302","relation":{},"ISSN":["0162-8828","2160-9292","1939-3539"],"issn-type":[{"value":"0162-8828","type":"print"},{"value":"2160-9292","type":"electronic"},{"value":"1939-3539","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,12]]}}}