{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,5]],"date-time":"2026-06-05T16:09:50Z","timestamp":1780675790727,"version":"3.54.1"},"reference-count":125,"publisher":"Springer Science and Business Media LLC","issue":"8","license":[{"start":{"date-parts":[[2025,5,12]],"date-time":"2025-05-12T00:00:00Z","timestamp":1747008000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,5,12]],"date-time":"2025-05-12T00:00:00Z","timestamp":1747008000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2025,8]]},"DOI":"10.1007\/s11263-025-02437-z","type":"journal-article","created":{"date-parts":[[2025,5,12]],"date-time":"2025-05-12T16:13:18Z","timestamp":1747066398000},"page":"5455-5482","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["An Information Theory-Inspired Strategy for Automated Network Pruning"],"prefix":"10.1007","volume":"133","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-6855-5403","authenticated-orcid":false,"given":"Xiawu","family":"Zheng","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yuexiao","family":"Ma","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Teng","family":"Xi","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Gang","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Errui","family":"Ding","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yuchao","family":"Li","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jie","family":"Chen","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yonghong","family":"Tian","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Rongrong","family":"Ji","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2025,5,12]]},"reference":[{"key":"2437_CR1","unstructured":"Abdelfattah, M.S., Mehrotra, A., Dudziak, \u0141., & Lane, N.D. (2021) Zero-cost proxies for lightweight NAS. arXiv preprint arXiv:2101.08134"},{"key":"2437_CR2","unstructured":"Achiam, J., Adler, S., Agarwal, S., Ahmad, L., Akkaya, I., Aleman, F.L., Almeida, D., Altenschmidt, J., Altman, S., & Anadkat, S., et al. (2023) Gpt-4 technical report. arXiv preprint arXiv:2303.08774"},{"key":"2437_CR3","doi-asserted-by":"crossref","unstructured":"Ahn, S., Hu, S.X., Damianou, A., Lawrence, N.D., & Dai, Z. (2019) Variational information distillation for knowledge transfer. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 9163\u20139171","DOI":"10.1109\/CVPR.2019.00938"},{"key":"2437_CR4","unstructured":"Alemi, A.A., Fischer, I., Dillon, J.V., & Murphy, K. (2016) Deep variational information bottleneck. arXiv preprint arXiv:1612.00410"},{"key":"2437_CR5","doi-asserted-by":"crossref","unstructured":"Alwani, M., Wang, Y., & Madhavan, V. (2022) Decore: Deep compression with reinforcement learning. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 12349\u201312359","DOI":"10.1109\/CVPR52688.2022.01203"},{"key":"2437_CR6","doi-asserted-by":"publisher","DOI":"10.1093\/oso\/9780195099713.001.0001","volume-title":"Evolutionary Algorithms in Theory and Practice: Evolution Strategies","author":"T Back","year":"1996","unstructured":"Back, T. (1996). Evolutionary Algorithms in Theory and Practice: Evolution Strategies. Genetic Algorithms: Evolutionary Programming."},{"key":"2437_CR7","first-page":"129","volume":"2","author":"D Blalock","year":"2020","unstructured":"Blalock, D., Gonzalez Ortiz, J. J., Frankle, J., & Guttag, J. (2020). What is the state of neural network pruning? Proceedings of Machine Learning and Systems, 2, 129\u2013146.","journal-title":"Proceedings of Machine Learning and Systems"},{"key":"2437_CR8","doi-asserted-by":"crossref","unstructured":"Caron, M., Touvron, H., Misra, I., J\u00e9gou, H., Mairal, J., Bojanowski, P., & Joulin, A. (2021) Emerging properties in self-supervised vision transformers. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 9650\u20139660","DOI":"10.1109\/ICCV48922.2021.00951"},{"key":"2437_CR9","doi-asserted-by":"crossref","unstructured":"Chen, L., Papandreou, G., Kokkinos, I., Murphy, K., & Yuille, A.L. (2018) Deeplab: Semantic image segmentation with deep convolutional nets, atrous convolution, and fully connected CRFS. In IEEE transactions on pattern analysis and machine intelligence (TPAMI)","DOI":"10.1109\/TPAMI.2017.2699184"},{"key":"2437_CR10","unstructured":"Chen, L.-C., Papandreou, G., Schroff, F., & Adam, H. (2017) Rethinking atrous convolution for semantic image segmentation. arXiv preprint arXiv:1706.05587"},{"key":"2437_CR11","doi-asserted-by":"crossref","unstructured":"Chen, X., Xie, S., & He, K. (2021) An empirical study of training self-supervised vision transformers. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 9640\u20139649","DOI":"10.1109\/ICCV48922.2021.00950"},{"key":"2437_CR12","doi-asserted-by":"crossref","unstructured":"Chen, P., Zhang, M., Shen, Y., Sheng, K., Gao, Y., Sun, X., Li, K., & Shen, C. (2022) Efficient decoder-free object detection with transformers. In European conference on computer vision, pp. 70\u201386. Springer","DOI":"10.1007\/978-3-031-20080-9_5"},{"issue":"1","key":"2437_CR13","doi-asserted-by":"publisher","first-page":"208","DOI":"10.1007\/s11263-023-01852-4","volume":"132","author":"X Chen","year":"2024","unstructured":"Chen, X., Ding, M., Wang, X., Xin, Y., Mo, S., Wang, Y., Han, S., Luo, P., Zeng, G., & Wang, J. (2024). Context autoencoder for self-supervised representation learning. International Journal of Computer Vision, 132(1), 208\u2013223.","journal-title":"International Journal of Computer Vision"},{"key":"2437_CR14","unstructured":"Cover, T.M. (1999) Elements of information theory"},{"key":"2437_CR15","unstructured":"Dai, B., Zhu, C., Guo, B., & Wipf, D. (2018) Compressing neural networks using the variational information bottleneck. In International conference on machine learning, pp. 1135\u20131144. PMLR"},{"key":"2437_CR16","unstructured":"Dong, X., & Yang, Y. (2019) Network pruning via transformable architecture search. In Advances in neural information processing systems"},{"key":"2437_CR17","doi-asserted-by":"crossref","unstructured":"Elkerdawy, S., Elhoushi, M., Zhang, H., & Ray, N. (2022) Fire together wire together: A dynamic pruning approach with self-supervised mask prediction. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 12454\u201312463","DOI":"10.1109\/CVPR52688.2022.01213"},{"key":"2437_CR18","doi-asserted-by":"crossref","unstructured":"Everingham, M., Van Gool, L., Williams, C. K., Winn, J., & Zisserman, A. (2010). The pascal visual object classes (voc) challenge. International Journal of Computer Vision,88(2), 303\u2013338.","DOI":"10.1007\/s11263-009-0275-4"},{"issue":"4","key":"2437_CR19","doi-asserted-by":"publisher","first-page":"173","DOI":"10.1017\/S2040618500033670","volume":"3","author":"WN Everitt","year":"1958","unstructured":"Everitt, W. N. (1958). A note on positive definite matrices. Proceedings of the Glasgow Mathematical Association, 3(4), 173\u2013175. https:\/\/doi.org\/10.1017\/S2040618500033670","journal-title":"Proceedings of the Glasgow Mathematical Association"},{"key":"2437_CR20","unstructured":"Frankle, J., & Carbin, M. (2018) The lottery ticket hypothesis: Finding sparse, trainable neural networks. In International conference on learning representations"},{"key":"2437_CR21","unstructured":"Frantar, E., & Alistarh, D. (2023) Sparsegpt: Massive language models can be accurately pruned in one-shot. In International conference on machine learning, pp. 10323\u201310337. PMLR"},{"key":"2437_CR22","doi-asserted-by":"crossref","unstructured":"Gao, Z., Wang, L., Han, B., & Guo, S. (2022) Adamixer: A fast-converging query-based object detector. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 5364\u20135373","DOI":"10.1109\/CVPR52688.2022.00529"},{"key":"2437_CR23","doi-asserted-by":"crossref","unstructured":"Girshick, R. (2015) Fast r-cnn. In: International conference on computer vision (ICCV)","DOI":"10.1109\/ICCV.2015.169"},{"key":"2437_CR24","unstructured":"Goldfeld, Z., van\u00a0den Berg, E., Greenewald, K., Melnyk, I., Nguyen, N., Kingsbury, B., & Polyanskiy, Y. (2018) Estimating information flow in neural networks. arxiv e-prints, page. arXiv preprint arXiv:1810.05728"},{"key":"2437_CR25","unstructured":"Gomez, A.N., Ren, M., Urtasun, R., & Grosse, R.B. (2017) The reversible residual network: Backpropagation without storing activations. In Advances in neural information processing systems 30"},{"key":"2437_CR26","doi-asserted-by":"crossref","unstructured":"Gretton, A., Bousquet, O., Smola, A., & Sch\u00f6lkopf, B. (2005) Measuring statistical dependence with hilbert-schmidt norms. In International conference on algorithmic learning theory, pp. 63\u201377. Springer","DOI":"10.1007\/11564089_7"},{"key":"2437_CR27","doi-asserted-by":"crossref","unstructured":"He, K., Chen, X., Xie, S., Li, Y., Doll\u00e1r, P., & Girshick, R. (2022) Masked autoencoders are scalable vision learners. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 16000\u201316009","DOI":"10.1109\/CVPR52688.2022.01553"},{"key":"2437_CR28","doi-asserted-by":"crossref","unstructured":"He, Y., Lin, J., Liu, Z., Wang, H., Li, L.-J., & Han, S. (2018) Amc: Automl for model compression and acceleration on mobile devices. In Proceedings of the European conference on computer vision (ECCV), pp. 784\u2013800","DOI":"10.1007\/978-3-030-01234-2_48"},{"key":"2437_CR29","doi-asserted-by":"crossref","unstructured":"He, Y., Liu, P., Wang, Z., Hu, Z., & Yang, Y. (2019) Filter pruning via geometric median for deep convolutional neural networks acceleration. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 4340\u20134349","DOI":"10.1109\/CVPR.2019.00447"},{"key":"2437_CR30","doi-asserted-by":"crossref","unstructured":"He, Y., Liu, P., Zhu, L., & Yang, Y. (2022) Filter pruning by switching to neighboring cnns with good attributes. In IEEE transactions on neural networks and learning systems","DOI":"10.1109\/TNNLS.2022.3149332"},{"key":"2437_CR31","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., & Sun, J. (2016) Deep residual learning for image recognition. In: Computer vision and pattern recognition (CVPR)","DOI":"10.1109\/CVPR.2016.90"},{"key":"2437_CR32","doi-asserted-by":"crossref","unstructured":"Hoeffding, W. (1994) Probability inequalities for sums of bounded random variables. In The collected works of Wassily Hoeffding, pp. 409\u2013426","DOI":"10.1007\/978-1-4612-0865-5_26"},{"key":"2437_CR33","first-page":"9782","volume":"33","author":"L Hou","year":"2020","unstructured":"Hou, L., Huang, Z., Shang, L., Jiang, X., Chen, X., & Liu, Q. (2020). Dynabert: Dynamic bert with adaptive width and depth. Advances in Neural Information Processing Systems, 33, 9782\u20139793.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"2437_CR34","doi-asserted-by":"crossref","unstructured":"Howard, A., Sandler, M., Chu, G., Chen, L.-C., Chen, B., Tan, M., Wang, W., Zhu, Y., Pang, R., & Vasudevan, V. (2019) Searching for mobilenetv3. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 1314\u20131324","DOI":"10.1109\/ICCV.2019.00140"},{"key":"2437_CR35","unstructured":"Howard, A.G., Zhu, M., Chen, B., Kalenichenko, D., Wang, W., Weyand, T., Andreetto, M., & Adam, H. (2017) Mobilenets: Efficient convolutional neural networks for mobile vision applications. arXiv preprint arXiv:1704.04861"},{"key":"2437_CR36","doi-asserted-by":"crossref","unstructured":"Huang, G., Liu, Z., Van Der\u00a0Maaten, L., & Weinberger, K.Q. (2017) Densely connected convolutional networks. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 4700\u20134708","DOI":"10.1109\/CVPR.2017.243"},{"key":"2437_CR37","doi-asserted-by":"crossref","unstructured":"Huang, W., Peng, Z., Dong, L., Wei, F., Jiao, J., & Ye, Q. (2023) Generic-to-specific distillation of masked autoencoders. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 15996\u201316005","DOI":"10.1109\/CVPR52729.2023.01535"},{"key":"2437_CR38","unstructured":"Ioffe, S., & Szegedy, C. (2015) Batch normalization: Accelerating deep network training by reducing internal covariate shift. In International conference on machine learning, pp. 448\u2013456. PMLR"},{"key":"2437_CR39","doi-asserted-by":"crossref","unstructured":"Jacob, B., Kligys, S., Chen, B., Zhu, M., Tang, M., Howard, A., Adam, H., & Kalenichenko, D. (2018) Quantization and training of neural networks for efficient integer-arithmetic-only inference. In: Computer vision and pattern recognition (CVPR)","DOI":"10.1109\/CVPR.2018.00286"},{"key":"2437_CR40","unstructured":"Jacobsen, J.-H., Smeulders, A., & Oyallon, E. (2018) i-revnet: Deep invertible networks. arXiv preprint arXiv:1802.07088"},{"key":"2437_CR41","doi-asserted-by":"crossref","unstructured":"Jia, D., Yuan, Y., He, H., Wu, X., Yu, H., Lin, W., Sun, L., Zhang, C., & Hu, H. (2023) Detrs with hybrid matching. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 19702\u201319712","DOI":"10.1109\/CVPR52729.2023.01887"},{"key":"2437_CR42","unstructured":"Jocher, G., Nishimura, K., Mineeva, T., & Vilarino, R. (2021) Yolov5. https:\/\/github.com\/ultralytics\/yolov5"},{"key":"2437_CR43","doi-asserted-by":"crossref","unstructured":"Kim, B., Jo, Y., Kim, J., & Kim, S. (2023) Misalign, contrast then distill: Rethinking misalignments in language-image pre-training. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 2563\u20132572","DOI":"10.1109\/ICCV51070.2023.00242"},{"key":"2437_CR44","unstructured":"Kornblith, S., Norouzi, M., Lee, H., & Hinton, G. (2019) Similarity of neural network representations revisited. In International conference on machine learning, pp. 3519\u20133529. PMLR"},{"key":"2437_CR45","unstructured":"Kraft, D., et al. (1988) A software package for sequential quadratic programming"},{"key":"2437_CR46","unstructured":"Krizhevsky, A., Sutskever, I., & Hinton, G.E. (2012) Imagenet classification with deep convolutional neural networks. In: Advances in neural information processing systems"},{"key":"2437_CR47","unstructured":"Kusupati, A., Ramanujan, V., Somani, R., Wortsman, M., Jain, P., Kakade, S., & Farhadi, A. (2020) Soft threshold weight reparameterization for learnable sparsity. In International conference on machine learning, pp. 5544\u20135555. PMLR"},{"key":"2437_CR48","doi-asserted-by":"crossref","unstructured":"LeCun, Y., Bengio, Y., & Hinton, G. (2015). Deep learning. nature,","DOI":"10.1038\/nature14539"},{"key":"2437_CR49","doi-asserted-by":"crossref","unstructured":"LeCun, Y., Bottou, L., Bengio, Y., & Haffner, P., et al. (1998) Gradient-based learning applied to document recognition. In Proceedings of the IEEE","DOI":"10.1109\/5.726791"},{"key":"2437_CR50","unstructured":"Lee, N., Ajanthan, T., & Torr, P.H. (2018) Snip: Single-shot network pruning based on connection sensitivity. arXiv preprint arXiv:1810.02340"},{"key":"2437_CR51","first-page":"1008","volume":"35","author":"J Lee","year":"2022","unstructured":"Lee, J., Kim, J., Shon, H., Kim, B., Kim, S. H., Lee, H., & Kim, J. (2022). Uniclip: Unified framework for contrastive language-image pre-training. Advances in Neural Information Processing Systems, 35, 1008\u20131019.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"2437_CR52","doi-asserted-by":"crossref","unstructured":"Li, Y., Adamczewski, K., Li, W., Gu, S., Timofte, R., & Van\u00a0Gool, L. (2022) Revisiting random channel pruning for neural network compression. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 191\u2013201","DOI":"10.1109\/CVPR52688.2022.00029"},{"key":"2437_CR53","unstructured":"Li, H., Kadav, A., Durdanovic, I., Samet, H., & Graf, H.P. (2016) Pruning filters for efficient convnets. In International conference on learning representations (ICLR)"},{"key":"2437_CR54","unstructured":"Li, Y., Liang, F., Zhao, L., Cui, Y., Ouyang, W., Shao, J., Yu, F., & Yan, J. (2021) Supervision exists everywhere: A data efficient contrastive language-image pre-training paradigm. arXiv preprint arXiv:2110.05208"},{"key":"2437_CR55","doi-asserted-by":"crossref","unstructured":"Li, C., Wang, G., Wang, B., Liang, X., Li, Z., & Chang, X. (2022) Ds-net++: Dynamic weight slicing for efficient inference in cnns and vision transformers. In IEEE transactions on pattern analysis and machine intelligence","DOI":"10.1109\/TPAMI.2022.3194044"},{"key":"2437_CR56","doi-asserted-by":"crossref","unstructured":"Li, F., Zeng, A., Liu, S., Zhang, H., Li, H., Zhang, L., & Ni, L.M. (2023) Lite detr: An interleaved multi-scale encoder for efficient detr. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 18558\u201318567","DOI":"10.1109\/CVPR52729.2023.01780"},{"key":"2437_CR57","doi-asserted-by":"crossref","unstructured":"Lin, H., Bai, H., Liu, Z., Hou, L., Sun, M., Song, L., Wei, Y., & Sun, Z. (2024) Mope-clip: Structured pruning for efficient vision-language models with module-wise pruning error metric. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 27370\u201327380","DOI":"10.1109\/CVPR52733.2024.02584"},{"key":"2437_CR58","doi-asserted-by":"crossref","unstructured":"Lin, S., Ji, R., Li, Y., Wu, Y., Huang, F., & Zhang, B. (2018) Accelerating convolutional networks via global & dynamic filter pruning. In: IJCAI, pp. 2425\u20132432","DOI":"10.24963\/ijcai.2018\/336"},{"key":"2437_CR59","doi-asserted-by":"crossref","unstructured":"Lin, M., Ji, R., Wang, Y., Zhang, Y., Zhang, B., Tian, Y., & Shao, L. (2020) Hrank: Filter pruning using high-rank feature map. In IEEE conference on computer vision and pattern recognition","DOI":"10.1109\/CVPR42600.2020.00160"},{"key":"2437_CR60","doi-asserted-by":"crossref","unstructured":"Lin, S., Ji, R., Yan, C., Zhang, B., Cao, L., Ye, Q., Huang, F., & Doermann, D. (2019) Towards optimal structured cnn pruning via generative adversarial learning. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 2790\u20132799","DOI":"10.1109\/CVPR.2019.00290"},{"key":"2437_CR61","unstructured":"Lin, M., Ji, R., Zhang, Y., Zhang, B., Wu, Y., & Tian, Y. (yyy) Channel pruning via automatic structure search"},{"key":"2437_CR62","unstructured":"Lin, J., Mao, X., Chen, Y., Xu, L., He, Y., & Xue, H. (2022) Detr: Decoder-only detr with computationally efficient cross-scale attention. arXiv preprint arXiv:2203.00860"},{"key":"2437_CR63","unstructured":"Liu, H., Li, C., Wu, Q., & Lee, Y.J. (2024) Visual instruction tuning. In Advances in neural information processing systems 36"},{"key":"2437_CR64","doi-asserted-by":"crossref","unstructured":"Liu, Z., Lin, Y., Cao, Y., Hu, H., Wei, Y., Zhang, Z., Lin, S., & Guo, B. (2021) Swin transformer: Hierarchical vision transformer using shifted windows. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 10012\u201310022","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"2437_CR65","doi-asserted-by":"crossref","unstructured":"Liu, Z., Mu, H., Zhang, X., Guo, Z., Yang, X., Cheng, K.-T., & Sun, J. (2019) Metapruning: Meta learning for automatic neural network channel pruning. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 3296\u20133305","DOI":"10.1109\/ICCV.2019.00339"},{"key":"2437_CR66","unstructured":"Liu, Z., Sun, M., Zhou, T., Huang, G., & Darrell, T. (2018) Rethinking the value of network pruning. In International conference on learning representations"},{"key":"2437_CR67","doi-asserted-by":"crossref","unstructured":"Long, J., Shelhamer, E., & Darrell, T. (2015) Fully convolutional networks for semantic segmentation. In: Computer vision and pattern recognition (CVPR)","DOI":"10.1109\/CVPR.2015.7298965"},{"issue":"2","key":"2437_CR68","doi-asserted-by":"publisher","first-page":"57","DOI":"10.1027\/1614-2241.2.2.57","volume":"2","author":"U Lorenzo-Seva","year":"2006","unstructured":"Lorenzo-Seva, U., & Ten Berge, J. M. (2006). Tucker\u2019s congruence coefficient as a meaningful index of factor similarity. Methodology, 2(2), 57\u201364.","journal-title":"Methodology"},{"key":"2437_CR69","unstructured":"Louizos, C., Welling, M., & Kingma, D.P. (2018) Learning sparse neural networks through l_0 regularization. In International conference on learning representations"},{"key":"2437_CR70","doi-asserted-by":"crossref","unstructured":"Luo, J.-H., Wu, J., & Lin, W. (2017) Thinet: A filter level pruning method for deep neural network compression. In International conference on computer vision (ICCV)","DOI":"10.1109\/ICCV.2017.541"},{"key":"2437_CR71","unstructured":"Luo, G., Zhou, Y., Ren, T., Chen, S., Sun, X., & Ji, R. (2024) Cheap and quick: Efficient vision-language instruction tuning for large language models. In Advances in neural information processing systems 36"},{"key":"2437_CR72","doi-asserted-by":"crossref","unstructured":"Ma, W.-D.K., Lewis, J., & Kleijn, W.B. (2020) The hsic bottleneck: Deep learning without back-propagation. In Proceedings of the AAAI conference on artificial intelligence, vol. 34, pp. 5085\u20135092","DOI":"10.1609\/aaai.v34i04.5950"},{"key":"2437_CR73","first-page":"21702","volume":"36","author":"X Ma","year":"2023","unstructured":"Ma, X., Fang, G., & Wang, X. (2023). Llm-pruner: On the structural pruning of large language models. Advances in Neural Information Processing Systems, 36, 21702\u201321720.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"2437_CR74","unstructured":"Mohri, M., Rostamizadeh, A., & Talwalkar, A. (2018) Foundations of machine learning"},{"key":"2437_CR75","doi-asserted-by":"crossref","unstructured":"Molchanov, P., Mallya, A., Tyree, S., Frosio, I., & Kautz, J. (2019) Importance estimation for neural network pruning. In Proceedings of the IEEE conference on computer vision and pattern recognition","DOI":"10.1109\/CVPR.2019.01152"},{"key":"2437_CR76","doi-asserted-by":"crossref","unstructured":"Molchanov, P., Mallya, A., Tyree, S., Frosio, I., & Kautz, J. (2019) Importance estimation for neural network pruning. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 11264\u201311272","DOI":"10.1109\/CVPR.2019.01152"},{"key":"2437_CR77","unstructured":"Molchanov, P., Tyree, S., Karras, T., Aila, T., & Kautz, J. (2017) Pruning convolutional neural networks for resource efficient inference. In 5th international conference on learning representations, ICLR"},{"key":"2437_CR78","doi-asserted-by":"crossref","unstructured":"Mu, N., Kirillov, A., Wagner, D., & Xie, S. (2022) Slip: Self-supervision meets language-image pre-training. In european conference on computer vision, pp. 529\u2013544. Springer","DOI":"10.1007\/978-3-031-19809-0_30"},{"key":"2437_CR79","first-page":"24898","volume":"34","author":"B Pan","year":"2021","unstructured":"Pan, B., Panda, R., Jiang, Y., Wang, Z., Feris, R., & Oliva, A. (2021). Ia-red $$^2$$: Interpretability-aware redundancy reduction for vision transformers. Advances in Neural Information Processing Systems, 34, 24898\u201324911.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"2437_CR80","unstructured":"Paszke, A., Gross, S., Chintala, S., Chanan, G., Yang, E., DeVito, Z., Lin, Z., Desmaison, A., Antiga, L., & Lerer, A. (2017) Automatic differentiation in pytorch"},{"key":"2437_CR81","unstructured":"Radford, A., Kim, J.W., Hallacy, C., Ramesh, A., Goh, G., Agarwal, S., Sastry, G., Askell, A., Mishkin, P., & Clark, J. (2021) Learning transferable visual models from natural language supervision. In International conference on machine learning, pp. 8748\u20138763. PMLR"},{"key":"2437_CR82","doi-asserted-by":"crossref","unstructured":"Ren, S., He, K., Girshick, R., & Sun, J. (2017) Faster r-cnn: Towards real-time object detection with region proposal networks. In IEEE transactions on pattern analysis and machine intelligence (TPAMI)","DOI":"10.1109\/TPAMI.2016.2577031"},{"key":"2437_CR83","doi-asserted-by":"crossref","unstructured":"Ren, S., Wei, F., Zhang, Z., & Hu, H. (2023) Tinymim: An empirical study of distilling mim pre-trained models. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 3687\u20133697","DOI":"10.1109\/CVPR52729.2023.00359"},{"issue":"6","key":"2437_CR84","doi-asserted-by":"publisher","first-page":"1137","DOI":"10.1109\/TPAMI.2016.2577031","volume":"39","author":"S Ren","year":"2016","unstructured":"Ren, S., He, K., Girshick, R., & Sun, J. (2016). Faster r-cnn: Towards real-time object detection with region proposal networks. IEEE Transactions on Pattern Analysis and Machine Intelligence, 39(6), 1137\u20131149.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"issue":"3","key":"2437_CR85","first-page":"257","volume":"25","author":"P Robert","year":"1976","unstructured":"Robert, P., & Escoufier, Y. (1976). A unifying tool for linear multivariate statistical methods: The RV-coefficient. Journal of the Royal Statistical Society: Series C (Applied Statistics), 25(3), 257\u2013265.","journal-title":"Journal of the Royal Statistical Society: Series C (Applied Statistics)"},{"key":"2437_CR86","doi-asserted-by":"crossref","unstructured":"Russakovsky, O., Deng, J., Su, H., Krause, J., Satheesh, S., Ma, S., Huang, Z., Karpathy, A., Khosla, A., & Bernstein, M., et al. (2015) Imagenet large scale visual recognition challenge. IJCV","DOI":"10.1007\/s11263-015-0816-y"},{"issue":"3","key":"2437_CR87","doi-asserted-by":"publisher","first-page":"289","DOI":"10.1007\/s00799-022-00329-y","volume":"23","author":"T Saikh","year":"2022","unstructured":"Saikh, T., Ghosal, T., Mittal, A., Ekbal, A., & Bhattacharyya, P. (2022). Scienceqa: A novel resource for question answering on scholarly articles. International Journal on Digital Libraries, 23(3), 289\u2013301.","journal-title":"International Journal on Digital Libraries"},{"key":"2437_CR88","doi-asserted-by":"crossref","unstructured":"Sandler, M., Howard, A., Zhu, M., Zhmoginov, A., & Chen, L.-C. (2018) Mobilenetv2: Inverted residuals and linear bottlenecks. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 4510\u20134520","DOI":"10.1109\/CVPR.2018.00474"},{"key":"2437_CR89","first-page":"11380","volume":"33","author":"P Savarese","year":"2020","unstructured":"Savarese, P., Silva, H., & Maire, M. (2020). Winning the lottery with continuous sparsification. Advances in Neural Information Processing Systems, 33, 11380\u201311390.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"2437_CR90","doi-asserted-by":"crossref","unstructured":"Saxe, A.M., Bansal, Y., Dapello, J., Advani, M., Kolchinsky, A., Tracey, B.D., & Cox, D.D. (2019) On the information bottleneck theory of deep learning. In Journal of statistical mechanics: Theory and experiment","DOI":"10.1088\/1742-5468\/ab3985"},{"key":"2437_CR91","unstructured":"Shwartz-Ziv, R., & Tishby, N. (2017) Opening the black box of deep neural networks via information. CoRR"},{"key":"2437_CR92","unstructured":"Shwartz-Ziv, R., Painsky, A., & Tishby, N. (2018) Representation compression and generalization in deep neural networks"},{"key":"2437_CR93","unstructured":"Simonyan, K., & Zisserman, A. (2014) Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556"},{"key":"2437_CR94","unstructured":"Song, H., Sun, D., Chun, S., Jampani, V., Han, D., Heo, B., Kim, W., & Yang, M.-H. (2022) An extendable, efficient and effective transformer-based object detector. arXiv preprint arXiv:2204.07962"},{"key":"2437_CR95","unstructured":"Sun, M., Liu, Z., Bair, A., & Kolter, J.Z. (2023) A simple and effective pruning approach for large language models. arXiv preprint arXiv:2306.11695"},{"key":"2437_CR96","unstructured":"Tan, M., & Le, Q. (2019) Efficientnet: Rethinking model scaling for convolutional neural networks. In International conference on machine learning, pp. 6105\u20136114. PMLR"},{"key":"2437_CR97","doi-asserted-by":"crossref","unstructured":"Tan, M., Chen, B., Pang, R., Vasudevan, V., Sandler, M., Howard, A., & Le, Q.V. (2019) Mnasnet: Platform-aware neural architecture search for mobile. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 2820\u20132828","DOI":"10.1109\/CVPR.2019.00293"},{"key":"2437_CR98","doi-asserted-by":"crossref","unstructured":"Tan, M., Pang, R., & Le, Q.V. (2020) Efficientdet: Scalable and efficient object detection. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 10781\u201310790","DOI":"10.1109\/CVPR42600.2020.01079"},{"key":"2437_CR99","first-page":"6377","volume":"33","author":"H Tanaka","year":"2020","unstructured":"Tanaka, H., Kunin, D., Yamins, D. L., & Ganguli, S. (2020). Pruning neural networks without any data by iteratively conserving synaptic flow. Advances in Neural Information Processing Systems, 33, 6377\u20136389.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"2437_CR100","unstructured":"Tishby, N., Pereira, F.C., & Bialek, W. (1999) The information bottleneck method. In: Proc. of the 37-th annual allerton conference on communication, control and computing"},{"key":"2437_CR101","unstructured":"Touvron, H., Cord, M., Douze, M., Massa, F., Sablayrolles, A., & J\u00e9gou, H. (2021) Training data-efficient image transformers & distillation through attention. In International conference on machine learning, pp. 10347\u201310357. PMLR"},{"key":"2437_CR102","unstructured":"Turner, J., Crowley, E.J., O\u2019Boyle, M., Storkey, A., & Gray, G. (2019) Blockswap: Fisher-guided block substitution for network compression on a budget. arXiv preprint arXiv:1906.04113"},{"key":"2437_CR103","unstructured":"Wang, J., Bai, H., Wu, J., Shi, X., Huang, J., King, I., Lyu, M., & Cheng, J. (2020) Revisiting parameter sharing for automatic neural channel number search. In Advances in neural information processing systems 33"},{"key":"2437_CR104","doi-asserted-by":"crossref","unstructured":"Wang, C.-Y., Bochkovskiy, A., & Liao, H.-Y.M. (2023) Yolov7: Trainable bag-of-freebies sets new state-of-the-art for real-time object detectors. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 7464\u20137475","DOI":"10.1109\/CVPR52729.2023.00721"},{"key":"2437_CR105","doi-asserted-by":"crossref","unstructured":"Wang, J., Chen, Y., Chakraborty, R., & Yu, S.X. (2020) Orthogonal convolutional neural networks. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 11505\u201311515","DOI":"10.1109\/CVPR42600.2020.01152"},{"key":"2437_CR106","unstructured":"Wang, S., Gao, J., Li, Z., Zhang, X., & Hu, W. (2023) A closer look at self-supervised lightweight vision transformers. In International conference on machine learning, pp. 35624\u201335641. PMLR"},{"key":"2437_CR107","unstructured":"Wang, Z., Huang, S.-L., Kuruoglu, E.E., Sun, J., Chen, X., & Zheng, Y. (2021) Pac-bayes information bottleneck. arXiv preprint arXiv:2109.14509"},{"key":"2437_CR108","doi-asserted-by":"crossref","unstructured":"Wang, T., Yuan, L., Chen, Y., Feng, J., & Yan, S. (2021) Pnp-detr: Towards efficient visual analysis with transformers. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 4661\u20134670","DOI":"10.1109\/ICCV48922.2021.00462"},{"key":"2437_CR109","doi-asserted-by":"crossref","unstructured":"Wang, T., Zhou, W., Zeng, Y., & Zhang, X. (2022) Efficientvlm: Fast and accurate vision-language models via knowledge distillation and modal-adaptive pruning. arXiv preprint arXiv:2210.07795","DOI":"10.18653\/v1\/2023.findings-acl.873"},{"key":"2437_CR110","unstructured":"Wen, W., Wu, C., Wang, Y., Chen, Y., & Li, H. (2016) Learning structured sparsity in deep neural networks. In Advances in neural information processing systems (NeurIPS)"},{"key":"2437_CR111","unstructured":"Wortsman, M., Farhadi, A., & Rastegari, M. (2019) Discovering neural wirings. In Advances in neural information processing systems 32"},{"key":"2437_CR112","doi-asserted-by":"crossref","unstructured":"Wu, B., Dai, X., Zhang, P., Wang, Y., Sun, F., Wu, Y., Tian, Y., Vajda, P., Jia, Y., & Keutzer, K. (2019) Fbnet: Hardware-aware efficient convnet design via differentiable neural architecture search. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition","DOI":"10.1109\/CVPR.2019.01099"},{"key":"2437_CR113","doi-asserted-by":"crossref","unstructured":"Wu, K., Peng, H., Zhou, Z., Xiao, B., Liu, M., Yuan, L., Xuan, H., Valenzuela, M., Chen, X.S., & Wang, X. (2023) Tinyclip: Clip distillation via affinity mimicking and weight inheritance. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 21970\u201321980","DOI":"10.1109\/ICCV51070.2023.02008"},{"key":"2437_CR114","doi-asserted-by":"crossref","unstructured":"Yang, K., Deng, J., An, X., Li, J., Feng, Z., Guo, J., Yang, J., & Liu, T. (2023) Alip: Adaptive language-image pre-training with synthetic caption. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 2922\u20132931","DOI":"10.1109\/ICCV51070.2023.00273"},{"key":"2437_CR115","doi-asserted-by":"crossref","unstructured":"Yang, T.-J., Howard, A., Chen, B., Zhang, X., Go, A., Sandler, M., Sze, V., & Adam, H. (2018) Netadapt: Platform-aware neural network adaptation for mobile applications. In: Proceedings of the European conference on computer vision (ECCV), pp. 285\u2013300","DOI":"10.1007\/978-3-030-01249-6_18"},{"key":"2437_CR116","unstructured":"Yang, H., Yin, H., Molchanov, P., Li, H., & Kautz, J. (2021) Nvit: Vision transformer compression and parameter redistribution"},{"issue":"12","key":"2437_CR117","doi-asserted-by":"publisher","first-page":"1551","DOI":"10.1631\/FITEE.2100463","volume":"22","author":"Y Yang","year":"2021","unstructured":"Yang, Y., Zhuang, Y., & Pan, Y. (2021). Multiple knowledge representation for big data artificial intelligence: framework, applications, and case studies. Frontiers of Information Technology & Electronic Engineering, 22(12), 1551\u20131558.","journal-title":"Frontiers of Information Technology & Electronic Engineering"},{"key":"2437_CR118","unstructured":"Yu, J., & Huang, T. (2019) Autoslim: Towards one-shot architecture search for channel numbers. arXiv preprint arXiv:1903.11728"},{"key":"2437_CR119","doi-asserted-by":"crossref","unstructured":"Yu, F., Huang, K., Wang, M., Cheng, Y., Chu, W., & Cui, L. (2022) Width & depth pruning for vision transformers. In AAAI conference on artificial intelligence (AAAI), vol. 2022","DOI":"10.1609\/aaai.v36i3.20222"},{"key":"2437_CR120","unstructured":"Yuan, X., Savarese, P.H.P., & Maire, M. (2020) Growing efficient deep networks by structured continuous sparsification. In International conference on learning representations"},{"key":"2437_CR121","doi-asserted-by":"crossref","unstructured":"Zhang, G., Luo, Z., Tian, Z., Zhang, J., Zhang, X., & Lu, S. (2023) Towards efficient use of multi-scale features in transformer-based object detectors. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 6206\u20136216","DOI":"10.1109\/CVPR52729.2023.00601"},{"key":"2437_CR122","unstructured":"Zhang, Z., Zhang, A., Li, M., Zhao, H., Karypis, G., & Smola, A. (2023) Multimodal chain-of-thought reasoning in language models. arXiv preprint arXiv:2302.00923"},{"key":"2437_CR123","doi-asserted-by":"crossref","unstructured":"Zhao, C., Ni, B., Zhang, J., Zhao, Q., Zhang, W., & Tian, Q. (2019) Variational convolutional neural network pruning. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 2780\u20132789","DOI":"10.1109\/CVPR.2019.00289"},{"key":"2437_CR124","doi-asserted-by":"crossref","unstructured":"Zhou, A., Li, Y., Qin, Z., Liu, J., Pan, J., Zhang, R., Zhao, R., Gao, P., & Li, H. (2023) Sparsemae: Sparse training meets masked autoencoders. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 16176\u201316186","DOI":"10.1109\/ICCV51070.2023.01482"},{"key":"2437_CR125","unstructured":"Zhou, S., Wu, Y., Ni, Z., Zhou, X., Wen, H., & Zou, Y. (2016) Dorefa-net: Training low bitwidth convolutional neural networks with low bitwidth gradients. In Computer vision and pattern recognition (CVPR)"}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02437-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11263-025-02437-z\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02437-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,6]],"date-time":"2025-09-06T15:23:43Z","timestamp":1757172223000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11263-025-02437-z"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,5,12]]},"references-count":125,"journal-issue":{"issue":"8","published-print":{"date-parts":[[2025,8]]}},"alternative-id":["2437"],"URL":"https:\/\/doi.org\/10.1007\/s11263-025-02437-z","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"value":"0920-5691","type":"print"},{"value":"1573-1405","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,5,12]]},"assertion":[{"value":"4 June 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 March 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 May 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}