{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,6]],"date-time":"2026-04-06T10:06:04Z","timestamp":1775469964090,"version":"3.50.1"},"reference-count":148,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"12","license":[{"start":{"date-parts":[[2023,12,1]],"date-time":"2023-12-01T00:00:00Z","timestamp":1701388800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0\/"}],"funder":[{"name":"Institute for interdisciplinary Information Core Technology"},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["31970972"],"award-info":[{"award-number":["31970972"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["11901338"],"award-info":[{"award-number":["11901338"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Tsinghua University Initiative Scientific Research Program"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Pattern Anal. Mach. Intell."],"published-print":{"date-parts":[[2023,12]]},"DOI":"10.1109\/tpami.2023.3300470","type":"journal-article","created":{"date-parts":[[2023,8,1]],"date-time":"2023-08-01T18:09:12Z","timestamp":1690913352000},"page":"15706-15724","source":"Crossref","is-referenced-by-count":41,"title":["Structured Knowledge Distillation for Accurate and Efficient Object Detection"],"prefix":"10.1109","volume":"45","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3341-183X","authenticated-orcid":false,"given":"Linfeng","family":"Zhang","sequence":"first","affiliation":[{"name":"Institute of Interdisciplinary Information Sciences, Tsinghua University, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9226-3366","authenticated-orcid":false,"given":"Kaisheng","family":"Ma","sequence":"additional","affiliation":[{"name":"Institute of Interdisciplinary Information Sciences, Tsinghua University, Beijing, China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"ref2","first-page":"91","article-title":"Faster R-CNN: Towards real-time object detection with region proposal networks","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Ren"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.322"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.244"},{"key":"ref5","first-page":"1","article-title":"Deep compression: Compressing deep neural networks with pruning, trained quantization and Huffman coding","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Han"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01237-3_12"},{"key":"ref7","first-page":"1","article-title":"Rethinking the value of network pruning","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Liu"},{"key":"ref8","first-page":"1","article-title":"The lottery ticket hypothesis: Finding sparse, trainable neural networks","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Frankle"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00141"},{"key":"ref10","first-page":"1","article-title":"Incremental network quantization: Towards lossless CNNs with low-precision weights","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Zhou"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00474"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00140"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01264-9_8"},{"key":"ref14","first-page":"1","article-title":"Squeezenet: Alexnet-level accuracy with 50x fewer parameters and < 0.5 mb model size","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Iandola"},{"key":"ref15","article-title":"Distilling the knowledge in a neural network","author":"Hinton","year":"2015"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1145\/1150402.1150464"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.776"},{"key":"ref18","first-page":"1","article-title":"Paying more attention to attention: Improving the performance of convolutional neural networks via attention transfer","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Zagoruyko"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.319"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00813"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00378"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i04.5963"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00489"},{"key":"ref24","first-page":"1","article-title":"FitNets: Hints for thin deep nets","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Romero"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00110"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.754"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00938"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00201"},{"key":"ref29","first-page":"14 759","article-title":"Task-oriented feature distillation","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Zhang"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00409"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00145"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00914"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58610-2_2"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58545-7_34"},{"key":"ref35","first-page":"742","article-title":"Learning efficient object detection models with knowledge distillation","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Chen"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00507"},{"key":"ref37","first-page":"953","article-title":"TKD: Temporal knowledge distillation for active perception","volume-title":"Proc. IEEE Winter Conf. Appl. Comput. Vis.","author":"Bajestani"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00271"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2018.2883743"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00256"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00395"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01005"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/ICME.2019.00009"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2019.8851980"},{"key":"ref45","article-title":"Large scale distributed neural network training through online distillation","author":"Anil","year":"2018"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00444"},{"key":"ref47","article-title":"Label refinery: Improving imageNet classification through label progression","author":"Bagherinezhad","year":"2018"},{"key":"ref48","article-title":"DistilBERT, a distilled version of BERT: Smaller, faster, cheaper and lighter","author":"Sanh","year":"2019"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.emnlp-main.633"},{"key":"ref50","first-page":"1","article-title":"Attention distillation for learning video representations","volume-title":"Proc. Brit. Mach. Vis. Conf.","author":"Liu"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00044"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00367"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00776"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01198"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01339"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i04.5765"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58574-7_39"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00533"},{"key":"ref59","article-title":"SCAN: A scalable neural networks framework towards compact and efficient models","author":"Zhang","year":"2019"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00381"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00694"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01312"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01387"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00045"},{"key":"ref65","first-page":"2351","article-title":"Ensemble distillation for robust model fusion in federated learning","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Lin"},{"key":"ref66","first-page":"4694","article-title":"When does label smoothing help?","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"M\u00fcller"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i04.5866"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr42600.2020.00756"},{"key":"ref69","first-page":"775","article-title":"KDGAN: Knowledge distillation with generative adversarial networks","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Wang"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2023.3248583"},{"key":"ref71","first-page":"16 468","article-title":"Instance-conditional knowledge distillation for object detection","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Kang"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00775"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00219"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2018\/309"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.155"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i3.16350"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00447"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00339"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01234-2_48"},{"key":"ref80","article-title":"PACT: Parameterized clipping activation for quantized neural networks","author":"Choi","year":"2018"},{"key":"ref81","first-page":"3123","article-title":"BinaryConnect: Training deep neural networks with binary weights during propagations","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Courbariaux"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46493-0_32"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01261-8_25"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00919"},{"key":"ref85","first-page":"1","article-title":"Multi-scale dense networks for resource efficient image classification","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Huang"},{"key":"ref86","first-page":"1","article-title":"Slimmable neural networks","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Yu"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00189"},{"key":"ref88","article-title":"Not all images are worth 16x16 words: Dynamic vision transformers with adaptive sequence length","author":"Wang","year":"2021"},{"key":"ref89","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01594"},{"key":"ref90","first-page":"2432","article-title":"Glance and focus: A dynamic approach to reducing spatial redundancy in image classification","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Wang"},{"key":"ref91","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_31"},{"key":"ref92","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00244"},{"key":"ref93","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1704.04861"},{"key":"ref94","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00716"},{"key":"ref95","first-page":"6105","article-title":"EfficientNet: Rethinking model scaling for convolutional neural networks","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Tan"},{"key":"ref96","article-title":"EfficientNetV2: Smaller models and faster training","author":"Tan","year":"2021"},{"key":"ref97","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00292"},{"key":"ref98","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2020.03.056"},{"key":"ref99","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.91"},{"key":"ref100","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.690"},{"key":"ref101","article-title":"YOLOv3: An incremental improvement","author":"Redmon","year":"2018"},{"key":"ref102","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00925"},{"key":"ref103","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00682"},{"key":"ref104","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr42600.2020.01079"},{"key":"ref105","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01284"},{"key":"ref106","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2005.38"},{"key":"ref107","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00563"},{"key":"ref108","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.623"},{"key":"ref109","article-title":"Non-local recurrent network for image restoration","author":"Liu","year":"2018"},{"key":"ref110","article-title":"Residual non-local attention networks for image restoration","author":"Zhang","year":"2019"},{"key":"ref111","article-title":"Cross-scale internal graph neural network for image super-resolution","author":"Zhou","year":"2020"},{"key":"ref112","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00320"},{"key":"ref113","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00714"},{"key":"ref114","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00069"},{"key":"ref115","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW.2019.00246"},{"key":"ref116","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00068"},{"key":"ref117","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01031"},{"key":"ref118","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58529-7_2"},{"key":"ref119","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2021.3056895"},{"key":"ref120","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00460"},{"key":"ref121","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"ref122","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.322"},{"key":"ref123","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.324"},{"key":"ref124","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1604.01685"},{"key":"ref125","article-title":"Benchmarking robustness in object detection: Autonomous driving when winter is coming","author":"Michaelis","year":"2019"},{"key":"ref126","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2019.2956516"},{"key":"ref127","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58555-6_16"},{"key":"ref128","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00754"},{"key":"ref129","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"ref130","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00093"},{"key":"ref131","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00975"},{"key":"ref132","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00657"},{"key":"ref133","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"ref134","article-title":"Distilling object detectors with task adaptive regularization","author":"Sun","year":"2020"},{"key":"ref135","first-page":"5213","article-title":"Distilling object detectors with feature richness","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Du"},{"key":"ref136","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i3.20240"},{"key":"ref137","first-page":"1","article-title":"Very deep convolutional networks for large-scale image recognition","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Simonyan"},{"key":"ref138","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref139","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01044"},{"key":"ref140","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"ref141","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.634"},{"key":"ref142","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2010.11929"},{"key":"ref143","first-page":"8024","article-title":"PyTorch: An imperative style, high-performance deep learning library","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Paszke"},{"key":"ref144","article-title":"MMDetection: Open MMLab detection toolbox and benchmark","author":"Chen","year":"2019"},{"key":"ref145","first-page":"1","article-title":"Benchmarking neural network robustness to common corruptions and perturbations","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Hendrycks"},{"key":"ref146","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2021\/628"},{"key":"ref147","first-page":"3351","article-title":"Self-distillation amplifies regularization in Hilbert space","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Mobahi"},{"key":"ref148","article-title":"Revisit knowledge distillation: A teacher-free framework","author":"Yuan","year":"2019"}],"container-title":["IEEE Transactions on Pattern Analysis and Machine Intelligence"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/34\/10308548\/10198386.pdf?arnumber=10198386","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,1]],"date-time":"2024-03-01T16:32:40Z","timestamp":1709310760000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10198386\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,12]]},"references-count":148,"journal-issue":{"issue":"12"},"URL":"https:\/\/doi.org\/10.1109\/tpami.2023.3300470","relation":{},"ISSN":["0162-8828","2160-9292","1939-3539"],"issn-type":[{"value":"0162-8828","type":"print"},{"value":"2160-9292","type":"electronic"},{"value":"1939-3539","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,12]]}}}