{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,21]],"date-time":"2026-05-21T05:29:38Z","timestamp":1779341378610,"version":"3.51.4"},"reference-count":70,"publisher":"Springer Science and Business Media LLC","issue":"16","license":[{"start":{"date-parts":[[2023,2,27]],"date-time":"2023-02-27T00:00:00Z","timestamp":1677456000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,2,27]],"date-time":"2023-02-27T00:00:00Z","timestamp":1677456000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61601266;61801272"],"award-info":[{"award-number":["61601266;61801272"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100007129","name":"Natural Science Foundation of Shandong Province","doi-asserted-by":"publisher","award":["ZR2021QD041;ZR2020MF127"],"award-info":[{"award-number":["ZR2021QD041;ZR2020MF127"]}],"id":[{"id":"10.13039\/501100007129","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Appl Intell"],"published-print":{"date-parts":[[2023,8]]},"DOI":"10.1007\/s10489-023-04499-3","type":"journal-article","created":{"date-parts":[[2023,2,27]],"date-time":"2023-02-27T21:10:32Z","timestamp":1677532232000},"page":"19199-19216","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":39,"title":["FPANet: feature pyramid attention network for crowd counting"],"prefix":"10.1007","volume":"53","author":[{"given":"Wenzhe","family":"Zhai","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3368-6013","authenticated-orcid":false,"given":"Mingliang","family":"Gao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qilei","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Gwanggil","family":"Jeon","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Marco","family":"Anisetti","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,2,27]]},"reference":[{"key":"4499_CR1","doi-asserted-by":"publisher","unstructured":"Abousamra S, Hoai M, Samaras D, Chen C (2021) Localization in the crowd with topological constraints. In: Proceedings of the AAAI conference on artificial intelligence (AAAI), pp 872\u2013881. https:\/\/doi.org\/10.1609\/aaai.v35i2.16170","DOI":"10.1609\/aaai.v35i2.16170"},{"key":"4499_CR2","doi-asserted-by":"publisher","unstructured":"Cao X, Wang Z, Zhao Y, Su F (2018) Scale aggregation network for accurate and efficient crowd counting. In: Proceedings of the European conference on computer vision (ECCV), pp 734\u2013750. https:\/\/doi.org\/10.1007\/978-3-030-01228-1_45","DOI":"10.1007\/978-3-030-01228-1_45"},{"key":"4499_CR3","doi-asserted-by":"publisher","unstructured":"Dai F, Liu H, Ma Y, Zhang X, Zhao Q (2021) Dense scale network for crowd counting. In: Proceedings of the 2021 international conference on multimedia retrieval, pp 64\u201372. https:\/\/doi.org\/10.1145\/3460426.3463628","DOI":"10.1145\/3460426.3463628"},{"key":"4499_CR4","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.neucom.2019.08.018","volume":"363","author":"J Gao","year":"2019","unstructured":"Gao J, Wang Q, Yuan Y (2019) Scar: spatial-\/channel-wise attention regression networks for crowd counting. Neurocomputing 363:1\u20138. https:\/\/doi.org\/10.1016\/j.neucom.2019.08.018","journal-title":"Neurocomputing"},{"key":"4499_CR5","doi-asserted-by":"publisher","first-page":"3486","DOI":"10.1109\/TCSVT.2019.2919139","volume":"30","author":"J Gao","year":"2020","unstructured":"Gao J, Wang Q, Li X (2020) Pcc net: perspective crowd counting via spatial convolutional network. IEEE Trans Circuits Syst Video Technol 30:3486\u20133498. https:\/\/doi.org\/10.1109\/TCSVT.2019.2919139","journal-title":"IEEE Trans Circuits Syst Video Technol"},{"key":"4499_CR6","doi-asserted-by":"publisher","unstructured":"Guo D, Li K, Zha Z, Wang M (2019) Dadnet: dilated-attention-deformable convnet for crowd counting. In: Proceedings of the ACM international conference on multimedia (ACM MM), pp 1823\u20131832. https:\/\/doi.org\/10.1145\/3343031.3350881","DOI":"10.1145\/3343031.3350881"},{"key":"4499_CR7","doi-asserted-by":"publisher","unstructured":"Guo J, Ma X, Sansom A, McGuire M, Kalaani A, Chen Q, Tang S, Yang Q, Fu S (2020) Spanet: spatial pyramid attention network for enhanced image recognition. In: Proceedings of the IEEE international conference on multimedia and expo (ICME), pp 1\u20136. https:\/\/doi.org\/10.1109\/ICME46284.2020.9102906","DOI":"10.1109\/ICME46284.2020.9102906"},{"key":"4499_CR8","doi-asserted-by":"publisher","unstructured":"He K, Zhang X, Ren S, Sun J (2016) Deep residual learning for image recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition (CVPR), pp 770\u2013778. https:\/\/doi.org\/10.1109\/cvpr.2016.90","DOI":"10.1109\/cvpr.2016.90"},{"key":"4499_CR9","doi-asserted-by":"publisher","unstructured":"Hsieh MR, Lin YL, Hsu WH (2017) Drone-based object counting by spatially regularized regional proposal network. In: Proceedings of the international conference on computer vision (ICCV), pp 4165\u20134173. https:\/\/doi.org\/10.1109\/ICCV.2017.446","DOI":"10.1109\/ICCV.2017.446"},{"key":"4499_CR10","doi-asserted-by":"publisher","unstructured":"Hu J, Shen L, Sun G (2018) Squeeze-and-excitation networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition (CVPR), pp 7132\u20137141. https:\/\/doi.org\/10.1109\/TPAMI.2019.2913372","DOI":"10.1109\/TPAMI.2019.2913372"},{"key":"4499_CR11","doi-asserted-by":"publisher","first-page":"1049","DOI":"10.1109\/TIP.2017.2740160","volume":"27","author":"S Huang","year":"2018","unstructured":"Huang S, Li X, Zhang Z, Wu F, Gao S, Ji R, Han J (2018) Body structure aware deep crowd counting. IEEE Trans Image Process 27:1049\u20131059. https:\/\/doi.org\/10.1109\/TIP.2017.2740160","journal-title":"IEEE Trans Image Process"},{"key":"4499_CR12","doi-asserted-by":"publisher","unstructured":"Idrees H, Saleemi I, Seibert C, Shah M (2013) Multi-source multi-scale counting in extremely dense crowd images. In: Proceedings of the IEEE conference on computer vision and pattern recognition (CVPR), pp 2547\u20132554. https:\/\/doi.org\/10.1109\/CVPR.2013.329","DOI":"10.1109\/CVPR.2013.329"},{"key":"4499_CR13","doi-asserted-by":"publisher","unstructured":"Idrees H, Tayyab M, Athrey K, Zhang D, Al-Maadeed S, Rajpoot N, Shah M (2018) Composition loss for counting, density map estimation and localization in dense crowds. In: Proceedings of the European conference on computer vision (ECCV), pp 532\u2013546. https:\/\/doi.org\/10.1007\/978-3-030-01216-8_33","DOI":"10.1007\/978-3-030-01216-8_33"},{"key":"4499_CR14","doi-asserted-by":"publisher","unstructured":"Ioffe S, Szegedy C (2015) Batch normalization: accelerating deep network training by reducing internal covariate shift. In: Proceedings of the international conference on international conference on machine learning (ICML), pp 448\u2013456. https:\/\/doi.org\/10.5555\/3045118.3045167","DOI":"10.5555\/3045118.3045167"},{"key":"4499_CR15","doi-asserted-by":"publisher","unstructured":"Jiang G, Peng J, Wang H, Mi Z, Fu X (2022) Tensorial multi-view clustering via low-rank constrained high-order graph learning. IEEE Trans Circuits Syst Video Technol. https:\/\/doi.org\/10.1109\/TCSVT.2022.3143848","DOI":"10.1109\/TCSVT.2022.3143848"},{"key":"4499_CR16","doi-asserted-by":"publisher","unstructured":"Jiang X, Zhang L, Xu M, Zhang T, Lv P, Zhou B, Yang X, Pang Y (2020) Attention scaling for crowd counting. In: Proceedings of the IEEE conference on computer vision and pattern recognition (CVPR), pp 4705\u20134714. https:\/\/doi.org\/10.1109\/cvpr42600.2020.00476","DOI":"10.1109\/cvpr42600.2020.00476"},{"key":"4499_CR17","doi-asserted-by":"publisher","unstructured":"Kasmani SA, He X, Jia W, Wang D, Zeibots M (2018) A-ccnn: adaptive ccnn for density estimation and crowd counting. In: Proceedings of the IEEE international conference on image processing (ICIP), pp 948\u2013952. https:\/\/doi.org\/10.1109\/ICIP.2018.8451399","DOI":"10.1109\/ICIP.2018.8451399"},{"key":"4499_CR18","unstructured":"Kingma DP, Ba J (2015) Adam: a method for stochastic optimization. In: Proceedings of the international conference on learning representations (ICLR"},{"key":"4499_CR19","doi-asserted-by":"publisher","first-page":"107616","DOI":"10.1016\/j.patcog.2020.107616","volume":"109","author":"Y Lei","year":"2021","unstructured":"Lei Y, Liu Y, Zhang P, Liu L (2021) Towards using count-level weak supervision for crowd counting. Pattern Recognit 109:107616. https:\/\/doi.org\/10.1016\/j.patcog.2020.107616","journal-title":"Pattern Recognit"},{"key":"4499_CR20","doi-asserted-by":"publisher","unstructured":"Li Y, Zhang X, Chen D (2018) Csrnet: dilated convolutional neural networks for understanding the highly congested scenes. In: Proceedings of the IEEE conference on computer vision and pattern recognition (CVPR), pp 1091\u20131100. https:\/\/doi.org\/10.1109\/CVPR.2018.00120","DOI":"10.1109\/CVPR.2018.00120"},{"key":"4499_CR21","doi-asserted-by":"publisher","unstructured":"Li Z, Liu H, Zhang Z, Liu T, Xiong NN (2021) Learning knowledge graph embedding with heterogeneous relation attention networks. IEEE Trans Neural Netw Learn Syst. https:\/\/doi.org\/10.1109\/TNNLS.2021.3055147","DOI":"10.1109\/TNNLS.2021.3055147"},{"key":"4499_CR22","doi-asserted-by":"publisher","first-page":"318","DOI":"10.1109\/TPAMI.2018.2858826","volume":"42","author":"TY Lin","year":"2020","unstructured":"Lin TY, Goyal P, Girshick RB, He K, Doll\u00e1r P (2020) Focal loss for dense object detection. IEEE Trans Pattern Anal Mach Intell 42:318\u2013327. https:\/\/doi.org\/10.1109\/TPAMI.2018.2858826","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"4499_CR23","doi-asserted-by":"publisher","unstructured":"Liu H, Fang S, Zhang Z, Li D, Lin K, Wang J (2021a) Mfdnet: collaborative poses perception and matrix fisher distribution for head pose estimation. IEEE Trans Multimed 24:2449\u20132460. https:\/\/doi.org\/10.1109\/TMM.2021.3081873","DOI":"10.1109\/TMM.2021.3081873"},{"key":"4499_CR24","doi-asserted-by":"publisher","unstructured":"Liu H, Zheng C, Li D, Shen X, Lin K, Wang J, Zhang Z, Zhang Z, Xiong NN (2021b) Edmf: efficient deep matrix factorization with review feature learning for industrial recommender system. IEEE Trans Industr Inf 18(7):4361\u20134371. https:\/\/doi.org\/10.1109\/TII.2021.3128240","DOI":"10.1109\/TII.2021.3128240"},{"key":"4499_CR25","doi-asserted-by":"publisher","unstructured":"Liu H, Liu T, Chen Y, Zhang Z, Li YF (2022a) Ehpe: skeleton cues-based gaussian coordinate encoding for efficient human pose estimation. IEEE Trans Multimed. https:\/\/doi.org\/10.1109\/TMM.2022.3197364","DOI":"10.1109\/TMM.2022.3197364"},{"key":"4499_CR26","doi-asserted-by":"publisher","unstructured":"Liu H, Zheng C, Li D, Zhang Z, Lin K, Shen X, Xiong NN, Wang J (2022b) Multi-perspective social recommendation method with graph representation learning. Neurocomputing 468:469\u2013481. https:\/\/doi.org\/10.1016\/j.neucom.2021.10.050","DOI":"10.1016\/j.neucom.2021.10.050"},{"key":"4499_CR27","doi-asserted-by":"publisher","unstructured":"Liu J, Gao C, Meng D, Hauptmann A (2018) Decidenet: counting varying density crowds through attention guided detection and density estimation. In: Proceedings of the IEEE conference on computer vision and pattern recognition (CVPR), pp 5197\u20135206. https:\/\/doi.org\/10.1109\/CVPR.2018.00545","DOI":"10.1109\/CVPR.2018.00545"},{"key":"4499_CR28","doi-asserted-by":"publisher","unstructured":"Liu L, Jiang J, Jia W, Amirgholipour S, Wang Y, Zeibots M, He X (2021c) Denet: a universal network for counting crowd with varying densities and scales. IEEE Trans Multimed 23:1060\u20131068. https:\/\/doi.org\/10.1109\/TMM.2020.2992979","DOI":"10.1109\/TMM.2020.2992979"},{"key":"4499_CR29","doi-asserted-by":"publisher","unstructured":"Liu T, Wang J, Yang B, Wang X (2021d) Ngdnet: nonuniform gaussian-label distribution learning for infrared head pose estimation and on-task behavior understanding in the classroom. Neurocomputing 436:210\u2013220. https:\/\/doi.org\/10.1016\/j.neucom.2020.12.090","DOI":"10.1016\/j.neucom.2020.12.090"},{"key":"4499_CR30","doi-asserted-by":"publisher","unstructured":"Liu W, Anguelov D, Erhan D, Szegedy C, Reed SE, Fu CY, Berg AC (2016) Ssd: single shot multibox detector. In: Proceedings of the European conference on computer vision (ECCV), pp 21\u201337. https:\/\/doi.org\/10.1007\/978-3-319-46448-0_2","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"4499_CR31","doi-asserted-by":"publisher","unstructured":"Ma YJ, Shuai HH, Cheng WH (2021) Spatiotemporal dilated convolution with uncertain matching for video-based crowd estimation. IEEE Trans Multimed. https:\/\/doi.org\/10.1109\/TMM.2021.3050059","DOI":"10.1109\/TMM.2021.3050059"},{"key":"4499_CR32","doi-asserted-by":"publisher","unstructured":"Ma Z, Wei X, Hong X, Gong Y (2019) Bayesian loss for crowd count estimation with point supervision. In: Proceedings of the international conference on computer vision (ICCV), pp 6141\u20136150. https:\/\/doi.org\/10.1109\/ICCV.2019.00624","DOI":"10.1109\/ICCV.2019.00624"},{"key":"4499_CR33","doi-asserted-by":"publisher","unstructured":"Marsden M, McGuinness K, Little S, O\u2019Connor N (2017) Fully convolutional crowd counting on highly congested scenes. In: Proceedings of the international joint conference on computer vision, imaging and computer graphics theory and applications (VISIGRAPP), pp 27\u201333. https:\/\/doi.org\/10.5220\/0006097300270033","DOI":"10.5220\/0006097300270033"},{"key":"4499_CR34","doi-asserted-by":"publisher","unstructured":"Meng Y, Zhang H, Zhao Y, Yang X, Qian X, Huang X, Zheng Y (2021) Spatial uncertainty-aware semi-supervised crowd counting. In: Proceedings of the international conference on computer vision (ICCV), pp 15549\u201315559. https:\/\/doi.org\/10.1109\/ICCV48922.2021.01526","DOI":"10.1109\/ICCV48922.2021.01526"},{"key":"4499_CR35","doi-asserted-by":"publisher","unstructured":"Nair V, Hinton GE (2010) Rectified linear units improve restricted boltzmann machines. In: Proceedings of the international conference on international conference on machine learning (ICML), pp 807\u2013814. https:\/\/doi.org\/10.5555\/3104322.3104425","DOI":"10.5555\/3104322.3104425"},{"key":"4499_CR36","doi-asserted-by":"publisher","unstructured":"hwan Oh M, Olsen P, Ramamurthy K (2020) Crowd counting with decomposed uncertainty. In: Proceedings of the AAAI conference on artificial intelligence (AAAI), pp 11799\u201311806. https:\/\/doi.org\/10.1609\/AAAI.V34I07.6852","DOI":"10.1609\/AAAI.V34I07.6852"},{"key":"4499_CR37","doi-asserted-by":"publisher","unstructured":"Ranjan V, Le HM, Hoai M (2018) Iterative crowd counting. In: Proceedings of the European conference on computer vision (ECCV), pp 278\u2013293. https:\/\/doi.org\/10.1007\/978-3-030-01234-2_17","DOI":"10.1007\/978-3-030-01234-2_17"},{"key":"4499_CR38","doi-asserted-by":"publisher","first-page":"1137","DOI":"10.1109\/TPAMI.2016.2577031","volume":"39","author":"S Ren","year":"2015","unstructured":"Ren S, He K, Girshick RB, Sun J (2015) Faster r-cnn: towards real-time object detection with region proposal networks. IEEE Trans Pattern Anal Mach Intell 39:1137\u20131149. https:\/\/doi.org\/10.1109\/TPAMI.2016.2577031","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"4499_CR39","doi-asserted-by":"publisher","unstructured":"Sajid U, Sajid H, Wang H, Wang G (2020) Zoomcount: a zooming mechanism for crowd counting in static images. IEEE Trans Circuits Syst Video Technol 30(10):3499\u20133512. https:\/\/doi.org\/10.1109\/TCSVT.2020.2978717","DOI":"10.1109\/TCSVT.2020.2978717"},{"key":"4499_CR40","doi-asserted-by":"publisher","unstructured":"Sam DB, Babu RV (2018) Top-down feedback for crowd counting convolutional neural network. In: Proceedings of the AAAI conference on artificial intelligence (AAAI), pp 7323\u20137330. https:\/\/doi.org\/10.1609\/aaai.v32i1.12290","DOI":"10.1609\/aaai.v32i1.12290"},{"key":"4499_CR41","doi-asserted-by":"publisher","unstructured":"Sam DB, Surya S, Babu RV (2017) Switching convolutional neural network for crowd counting. In: Proceedings of the IEEE conference on computer vision and pattern recognition (CVPR), pp 4031\u20134039. https:\/\/doi.org\/10.1109\/CVPR.2017.429","DOI":"10.1109\/CVPR.2017.429"},{"key":"4499_CR42","doi-asserted-by":"publisher","first-page":"2739","DOI":"10.1109\/tpami.2020.2974830","volume":"43","author":"DB Sam","year":"2021","unstructured":"Sam DB, Peri SV, Sundararaman MN, Kamath A, Babu RV (2021) Locate, size, and count: accurately resolving people in dense crowds via detection. IEEE Trans Pattern Anal Mach Intell 43:2739\u20132751. https:\/\/doi.org\/10.1109\/tpami.2020.2974830","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"4499_CR43","doi-asserted-by":"publisher","unstructured":"Shi Z, Zhang L, Liu Y, Cao X, Ye Y, Cheng MM, Zheng G (2018) Crowd counting with deep negative correlation learning. In: Proceedings of the IEEE conference on computer vision and pattern recognition (CVPR), pp 5382\u20135390. https:\/\/doi.org\/10.1109\/CVPR.2018.00564","DOI":"10.1109\/CVPR.2018.00564"},{"key":"4499_CR44","doi-asserted-by":"publisher","unstructured":"Sindagi V, Patel V (2017a) Cnn-based cascaded multi-task learning of high-level prior and density estimation for crowd counting. In: Proceedings of the IEEE international conference on advanced video and signal based surveillance (AVSS), pp 1\u20136. https:\/\/doi.org\/10.1109\/AVSS.2017.8078491","DOI":"10.1109\/AVSS.2017.8078491"},{"key":"4499_CR45","doi-asserted-by":"publisher","unstructured":"Sindagi V, Patel V (2017b) Generating high-quality crowd density maps using contextual pyramid cnns. In: Proceedings of the international conference on computer vision (ICCV), pp 1879\u20131888. https:\/\/doi.org\/10.1109\/ICCV.2017.206","DOI":"10.1109\/ICCV.2017.206"},{"key":"4499_CR46","doi-asserted-by":"publisher","first-page":"1035","DOI":"10.1109\/TIP.2018.2875353","volume":"28","author":"T Stahl","year":"2019","unstructured":"Stahl T, Pintea SL, Gemert JCV (2019) Divide and count: generic object counting by image divisions. IEEE Trans Image Process 28:1035\u20131044. https:\/\/doi.org\/10.1109\/TIP.2018.2875353","journal-title":"IEEE Trans Image Process"},{"key":"4499_CR47","doi-asserted-by":"publisher","unstructured":"Thanasutives P, Ichi Fukui K, Numao M, Kijsirikul B (2021) Encoder-decoder based convolutional neural networks with multi-scale-aware modules for crowd counting. In: Proceedings of the international conference on pattern recognition (ICPR), pp 2382\u20132389. https:\/\/doi.org\/10.1109\/ICPR48806.2021.9413286","DOI":"10.1109\/ICPR48806.2021.9413286"},{"key":"4499_CR48","doi-asserted-by":"publisher","unstructured":"Tian Z, Shen C, Chen H, He T (2019) Fcos: fully convolutional one-stage object detection. In: Proceedings of the international conference on computer vision (ICCV), pp 9626\u20139635. https:\/\/doi.org\/10.1109\/ICCV.2019.00972","DOI":"10.1109\/ICCV.2019.00972"},{"key":"4499_CR49","doi-asserted-by":"publisher","unstructured":"Wan J, Chan AB (2019) Adaptive density map generation for crowd counting. In: Proceedings of the international conference on computer vision (ICCV), pp 1130\u20131139. https:\/\/doi.org\/10.1109\/ICCV.2019.00122","DOI":"10.1109\/ICCV.2019.00122"},{"key":"4499_CR50","doi-asserted-by":"publisher","unstructured":"Wan J, Wang Q, Chan AB (2020) Kernel-based density map generation for dense object counting. IEEE Trans Pattern Anal Mach Intell:1\u20131. https:\/\/doi.org\/10.1109\/TPAMI.2020.3022878","DOI":"10.1109\/TPAMI.2020.3022878"},{"key":"4499_CR51","doi-asserted-by":"publisher","unstructured":"Wang H, Peng J, Chen D, Jiang G, Zhao T, Fu X (2020a) Attribute-guided feature learning network for vehicle reidentification. IEEE MultiMed 27(4):112\u2013121. https:\/\/doi.org\/10.1109\/MMUL.2020.2999464","DOI":"10.1109\/MMUL.2020.2999464"},{"key":"4499_CR52","doi-asserted-by":"publisher","unstructured":"Wang H, Peng J, Zhao Y, Fu X (2020b) Multi-path deep cnns for fine-grained car recognition. IEEE Trans Vehicular Technol 69(10):10484\u201310493. https:\/\/doi.org\/10.1109\/TVT.2020.3009162","DOI":"10.1109\/TVT.2020.3009162"},{"key":"4499_CR53","doi-asserted-by":"publisher","unstructured":"Wang H, Wang Y, Zhang Z, Fu X, Zhuo L, Xu M, Wang M (2020c) Kernelized multiview subspace analysis by self-weighted learning. IEEE Trans Multimed 23:3828\u20133840. https:\/\/doi.org\/10.1109\/TMM.2020.3032023","DOI":"10.1109\/TMM.2020.3032023"},{"key":"4499_CR54","doi-asserted-by":"publisher","unstructured":"Wang P, Gao C, Wang Y, Li H, Gao Y (2020d) Mobilecount: an efficient encoder-decoder framework for real-time crowd counting. Neurocomputing 407:292\u2013299. https:\/\/doi.org\/10.1016\/j.neucom.2020.05.056","DOI":"10.1016\/j.neucom.2020.05.056"},{"key":"4499_CR55","doi-asserted-by":"publisher","unstructured":"Wang Q, Gao J, Lin W, Yuan Y (2019a) Learning from synthetic data for crowd counting in the wild. In: Proceedings of the IEEE conference on computer vision and pattern recognition (CVPR), pp 8190\u20138199. https:\/\/doi.org\/10.1109\/CVPR.2019.00839","DOI":"10.1109\/CVPR.2019.00839"},{"key":"4499_CR56","doi-asserted-by":"publisher","unstructured":"Wang Q, Wu B, Zhu P, Li P, Zuo W, Hu Q (2020e) Eca-net: efficient channel attention for deep convolutional neural networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition (CVPR), pp 11531\u201311539. https:\/\/doi.org\/10.1109\/CVPR42600.2020.01155","DOI":"10.1109\/CVPR42600.2020.01155"},{"key":"4499_CR57","doi-asserted-by":"publisher","unstructured":"Wang Q, Gao J, Lin W, Li X (2021a) Nwpu-crowd: a large-scale benchmark for crowd counting and localization. IEEE Trans Pattern Anal Mach Intell 43:2141\u20132149. https:\/\/doi.org\/10.1109\/TPAMI.2020.3013269","DOI":"10.1109\/TPAMI.2020.3013269"},{"key":"4499_CR58","doi-asserted-by":"publisher","unstructured":"Wang Q, Han T, Gao J, Yuan Y (2021b) Neuron linear transformation: modeling the domain shift for crowd counting. IEEE Trans Neural Netw Learn Syst:1\u201313. https:\/\/doi.org\/10.1109\/TNNLS.2021.3051371","DOI":"10.1109\/TNNLS.2021.3051371"},{"key":"4499_CR59","doi-asserted-by":"publisher","unstructured":"Wang Y, Hu S, Wang G, Chen C, Pan Z (2019b) Multi-scale dilated convolution of convolutional neural network for crowd counting. Multimed Tools Appl 79:1057\u20131073. https:\/\/doi.org\/10.1007\/s11042-019-08208-6","DOI":"10.1007\/s11042-019-08208-6"},{"key":"4499_CR60","doi-asserted-by":"publisher","unstructured":"Wen L, Du D, Zhu P, Hu Q, Wang Q, Bo L, Lyu S (2021) Detection, tracking, and counting meets drones in crowds: a benchmark. In: Proceedings of the IEEE conference on computer vision and pattern recognition (CVPR), pp 7808\u20137817. https:\/\/doi.org\/10.1109\/CVPR46437.2021.00772","DOI":"10.1109\/CVPR46437.2021.00772"},{"key":"4499_CR61","doi-asserted-by":"publisher","unstructured":"Woo S, Park J, Lee JY, Kweon IS (2018) Cbam: convolutional block attention module. In: Proceedings of the European conference on computer vision (ECCV), pp 3\u201319. https:\/\/doi.org\/10.1007\/978-3-030-01234-2_1","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"4499_CR62","doi-asserted-by":"publisher","unstructured":"Yang X, Yang J, Yan J, Zhang Y, Zhang T, Guo Z, Sun X, Fu K (2019) Scrdet: towards more robust detection for small, cluttered and rotated objects. In: Proceedings of the international conference on computer vision (ICCV), pp 8231\u20138240. https:\/\/doi.org\/10.1109\/ICCV.2019.00832","DOI":"10.1109\/ICCV.2019.00832"},{"key":"4499_CR63","doi-asserted-by":"publisher","unstructured":"Zhai W, Gao M, Anisetti M, Li Q, Jeon S, Pan J (2022a) Group-split attention network for crowd counting. J Electr Imaging 31(4):041214. https:\/\/doi.org\/10.1117\/1.JEI.31.4.041214","DOI":"10.1117\/1.JEI.31.4.041214"},{"key":"4499_CR64","doi-asserted-by":"publisher","unstructured":"Zhai W, Gao M, Souri A, Li Q, Guo X, Shang J, Zou G (2022b) An attentive hierarchy convnet for crowd counting in smart city. Cluster Comput:1\u201313. https:\/\/doi.org\/10.1007\/s10586-022-03749-2","DOI":"10.1007\/s10586-022-03749-2"},{"key":"4499_CR65","doi-asserted-by":"publisher","unstructured":"Zhai W, Li Q, Zhou Y, Li X, Pan J, Zou G, Gao M (2022c) Da2net: a dual attention-aware network for robust crowd counting. Multimed Syst. https:\/\/doi.org\/10.1007\/s00530-021-00877-4","DOI":"10.1007\/s00530-021-00877-4"},{"key":"4499_CR66","doi-asserted-by":"publisher","unstructured":"Zhang C, Li H, Wang X, Yang X (2015) Cross-scene crowd counting via deep convolutional neural networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition (CVPR), pp 833\u2013841. https:\/\/doi.org\/10.1109\/CVPR.2015.7298684","DOI":"10.1109\/CVPR.2015.7298684"},{"key":"4499_CR67","doi-asserted-by":"publisher","unstructured":"Zhang L, Shi M, Chen Q (2018) Crowd counting via scale-adaptive convolutional neural network. In: Proceedings of the IEEE workshop on applications of computer vision (WACV), pp 1113\u20131121. https:\/\/doi.org\/10.1109\/WACV.2018.00127","DOI":"10.1109\/WACV.2018.00127"},{"key":"4499_CR68","doi-asserted-by":"publisher","first-page":"982","DOI":"10.1109\/TPAMI.2019.2943860","volume":"43","author":"L Zhang","year":"2021","unstructured":"Zhang L, Shi Z, Cheng MM, Liu Y, Bian JW, Zhou JT, Zheng G, Zeng Z (2021) Nonlinear regression via deep negative correlation learning. IEEE Trans Pattern Anal Mach Intell 43:982\u2013998. https:\/\/doi.org\/10.1109\/TPAMI.2019.2943860","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"4499_CR69","doi-asserted-by":"publisher","unstructured":"Zhang Y, Zhou D, Chen S, Gao S, Ma Y (2016) Single-image crowd counting via multi-column convolutional neural network. In: Proceedings of the IEEE conference on computer vision and pattern recognition (CVPR), pp 589\u2013597. https:\/\/doi.org\/10.1109\/CVPR.2016.70","DOI":"10.1109\/CVPR.2016.70"},{"key":"4499_CR70","doi-asserted-by":"publisher","first-page":"75","DOI":"10.1016\/j.neucom.2019.08.009","volume":"367","author":"Z Zou","year":"2019","unstructured":"Zou Z, Cheng Y, Qu X, Ji S, Guo X, Zhou P (2019) Attend to count: crowd counting with adaptive capacity multi-scale cnns. Neurocomputing 367:75\u201383. https:\/\/doi.org\/10.1016\/J.NEUCOM.2019.08.009","journal-title":"Neurocomputing"}],"container-title":["Applied Intelligence"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-023-04499-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10489-023-04499-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-023-04499-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,28]],"date-time":"2023-08-28T05:09:02Z","timestamp":1693199342000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10489-023-04499-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,2,27]]},"references-count":70,"journal-issue":{"issue":"16","published-print":{"date-parts":[[2023,8]]}},"alternative-id":["4499"],"URL":"https:\/\/doi.org\/10.1007\/s10489-023-04499-3","relation":{},"ISSN":["0924-669X","1573-7497"],"issn-type":[{"value":"0924-669X","type":"print"},{"value":"1573-7497","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,2,27]]},"assertion":[{"value":"31 January 2023","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 February 2023","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"The authors have no conflict of interest to declare that are relevant to the content of this article.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}}]}}