{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,2]],"date-time":"2026-06-02T09:16:48Z","timestamp":1780391808083,"version":"3.54.1"},"reference-count":89,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"3","license":[{"start":{"date-parts":[[2024,3,1]],"date-time":"2024-03-01T00:00:00Z","timestamp":1709251200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2024,3,1]],"date-time":"2024-03-01T00:00:00Z","timestamp":1709251200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,3,1]],"date-time":"2024-03-01T00:00:00Z","timestamp":1709251200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100000923","name":"Australian Research Council","doi-asserted-by":"publisher","award":["DE200101283"],"award-info":[{"award-number":["DE200101283"]}],"id":[{"id":"10.13039\/501100000923","id-type":"DOI","asserted-by":"publisher"}]},{"name":"ARC Centre of Excellence in Robotic Vision","award":["CE140100016"],"award-info":[{"award-number":["CE140100016"]}]},{"name":"ARC Discovery","award":["DP210102801"],"award-info":[{"award-number":["DP210102801"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Pattern Anal. Mach. Intell."],"published-print":{"date-parts":[[2024,3]]},"DOI":"10.1109\/tpami.2021.3138337","type":"journal-article","created":{"date-parts":[[2021,12,24]],"date-time":"2021-12-24T20:31:59Z","timestamp":1640377919000},"page":"1589-1602","source":"Crossref","is-referenced-by-count":73,"title":["Improving Semantic Segmentation via Efficient Self-Training"],"prefix":"10.1109","volume":"46","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-6482-6712","authenticated-orcid":false,"given":"Yi","family":"Zhu","sequence":"first","affiliation":[{"name":"Amazon Web Services, Santa Clara, CA, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9585-8581","authenticated-orcid":false,"given":"Zhongyue","family":"Zhang","sequence":"additional","affiliation":[{"name":"Snapchat, Sunnyvale, CA, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4569-5024","authenticated-orcid":false,"given":"Chongruo","family":"Wu","sequence":"additional","affiliation":[{"name":"UC Davis, Davis, CA, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0249-1678","authenticated-orcid":false,"given":"Zhi","family":"Zhang","sequence":"additional","affiliation":[{"name":"Amazon Web Services, Santa Clara, CA, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2388-8618","authenticated-orcid":false,"given":"Tong","family":"He","sequence":"additional","affiliation":[{"name":"Amazon Web Services, Santa Clara, CA, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7816-4238","authenticated-orcid":false,"given":"Hang","family":"Zhang","sequence":"additional","affiliation":[{"name":"Facebook, Menlo Park, CA, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2315-8583","authenticated-orcid":false,"given":"R.","family":"Manmatha","sequence":"additional","affiliation":[{"name":"Amazon Web Services, Santa Clara, CA, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4433-2301","authenticated-orcid":false,"given":"Mu","family":"Li","sequence":"additional","affiliation":[{"name":"Amazon Web Services, Santa Clara, CA, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7963-4721","authenticated-orcid":false,"given":"Alexander","family":"Smola","sequence":"additional","affiliation":[{"name":"Amazon Web Services, Santa Clara, CA, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.350"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.534"},{"key":"ref3","article-title":"BDD100K: A diverse driving video database with scalable annotation tooling","author":"Yu","year":"2018"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.97"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01216-8_12"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-020-01316-z"},{"key":"ref7","article-title":"YouTube-8m: A large-scale video classification benchmark","author":"Abu-El-Haija","year":"2016"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-49409-8_66"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.77"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW.2017.36"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00906"},{"key":"ref12","first-page":"205","article-title":"Improving fast segmentation with teacher-student learning","volume-title":"Proc. Brit. Mach. Vis. Conf.","author":"Xie"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr.2019.00271"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/iccv.2017.606"},{"key":"ref15","first-page":"200","article-title":"Adversarial learning for semi-supervised semantic segmentation","volume-title":"Proc. Brit. Mach. Vis. Conf.","author":"Hung"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2019.2960224"},{"key":"ref17","article-title":"Semi-supervised semantic segmentation needs strong, high-dimensional perturbations","author":"French","year":"2019"},{"key":"ref18","first-page":"297","article-title":"Domain adaptation for semantic segmentation via class-balanced self-training","volume-title":"Proc. Eur. Conf. Comput. Vis.","author":"Zou"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00608"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr42600.2020.01070"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01261-8_20"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.660"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1802.02611"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00591"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr42600.2020.01249"},{"key":"ref27","article-title":"OCNet: Object context network for scene parsing","author":"Yuan","year":"2018"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58539-6_11"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00326"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00685"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01240-3_17"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00690"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2020.3007032"},{"key":"ref34","article-title":"Fast-SCNN: Fast semantic segmentation network","author":"Poudel","year":"2019"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00975"},{"key":"ref36","article-title":"FastFCN: Rethinking dilated convolution in the backbone for semantic segmentation","author":"Wu","year":"2019"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00017"},{"key":"ref38","first-page":"8713","article-title":"Searching for efficient multi-scale architectures for dense image prediction","volume-title":"Proc. 32nd Int. Conf. Neural Inf. Process. Syst.","author":"Chen"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00934"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01191"},{"key":"ref41","article-title":"Billion-scale semi-supervised learning for image classification","author":"Yalniz","year":"2019"},{"key":"ref42","article-title":"Hierarchical multi-scale attention for semantic segmentation","author":"Tao","year":"2020"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58545-7_40"},{"key":"ref44","article-title":"Semi-supervised semantic segmentation via dynamic self-training and class-balanced curriculum","author":"Feng","year":"2020"},{"key":"ref45","article-title":"Rethinking pre-training and self-training","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Zoph"},{"key":"ref46","first-page":"1994","article-title":"CyCADA: Cycle-consistent adversarial domain adaptation","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Hoffman"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00780"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00262"},{"key":"ref49","article-title":"Category anchor-guided unsupervised domain adaptation for semantic segmentation","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Zhang"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00686"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00189"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01053"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00219"},{"key":"ref54","article-title":"FixMatch: Simplifying semi-supervised learning with consistency and confidence","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Sohn"},{"key":"ref55","first-page":"896","article-title":"Pseudo-Label:The simple and efficient semi-supervised learning method for deep neural networks","volume-title":"Proc. Int. Conf. Mach. Learn. Workshops","author":"Lee"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2858821"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00023"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-88682-2_5"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-014-0733-5"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2011.6126343"},{"key":"ref61","article-title":"ParseNet: Looking wider to see better","volume-title":"Proc. Int. Conf. Learn Representations","author":"Liu"},{"key":"ref62","article-title":"High-performance semantic segmentation using very deep fully convolutional networks","author":"Wu","year":"2016"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00065"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01219-9_25"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2019.01.006"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2017.2699184"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01269"},{"key":"ref68","article-title":"Pseudoseg: Designing pseudo labels for semantic segmentation","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Zou"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00106"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01246-5_36"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00388"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00532"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00692"},{"key":"ref74","article-title":"High-Resolution representations for labeling pixels and regions","author":"Sun","year":"2019"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00926"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00533"},{"key":"ref77","first-page":"244","article-title":"Global aggregation then local distribution in fully convolutional networks","volume-title":"Proc. Brit. Mach. Vis. Conf.","author":"Li"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58520-4_26"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58548-8_7"},{"key":"ref80","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-021-01445-z"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01374"},{"key":"ref82","article-title":"Mixed precision training","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Micikevicius"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.75"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58610-2_29"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00858"},{"key":"ref86","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-019-01188-y"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00909"},{"key":"ref88","article-title":"Rethinking atrous convolution for semantic image segmentation","author":"Chen","year":"2017"},{"key":"ref89","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00747"}],"container-title":["IEEE Transactions on Pattern Analysis and Machine Intelligence"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/34\/10423572\/09663011.pdf?arnumber=9663011","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,1]],"date-time":"2024-03-01T21:35:35Z","timestamp":1709328935000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9663011\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,3]]},"references-count":89,"journal-issue":{"issue":"3"},"URL":"https:\/\/doi.org\/10.1109\/tpami.2021.3138337","relation":{},"ISSN":["0162-8828","2160-9292","1939-3539"],"issn-type":[{"value":"0162-8828","type":"print"},{"value":"2160-9292","type":"electronic"},{"value":"1939-3539","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,3]]}}}