{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,26]],"date-time":"2026-02-26T07:15:13Z","timestamp":1772090113416,"version":"3.50.1"},"reference-count":50,"publisher":"Springer Science and Business Media LLC","issue":"13","license":[{"start":{"date-parts":[[2021,3,5]],"date-time":"2021-03-05T00:00:00Z","timestamp":1614902400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,3,5]],"date-time":"2021-03-05T00:00:00Z","timestamp":1614902400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61573168"],"award-info":[{"award-number":["61573168"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2021,5]]},"DOI":"10.1007\/s11042-021-10718-1","type":"journal-article","created":{"date-parts":[[2021,3,5]],"date-time":"2021-03-05T05:02:24Z","timestamp":1614920544000},"page":"20283-20305","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":13,"title":["Feature pyramid of bi-directional stepped concatenation for small object detection"],"prefix":"10.1007","volume":"80","author":[{"given":"Qiyuan","family":"Zheng","sequence":"first","affiliation":[]},{"given":"Ying","family":"Chen","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2021,3,5]]},"reference":[{"key":"10718_CR1","doi-asserted-by":"crossref","unstructured":"Bell S, Lawrence Zitnick C, Bala K, Girshick R (2016) Inside-outside net: detecting objects in context with skip pooling and recurrent neural networks. 
In: Computer vision and pattern recognition, pp 2874\u20132883","DOI":"10.1109\/CVPR.2016.314"},{"issue":"2","key":"10718_CR2","doi-asserted-by":"publisher","first-page":"41","DOI":"10.1109\/MITS.2019.2903525","volume":"11","author":"Z Chen","year":"2019","unstructured":"Chen Z, Zhang Y, Wu C, Ran B (2019) Understanding individualization driving states via latent Dirichlet allocation model. IEEE Intell Transp Syst Mag 11(2):41\u201353","journal-title":"IEEE Intell Transp Syst Mag"},{"key":"10718_CR3","unstructured":"Dai J, Li Y, He K, Sun J (2016) R-FCN: object detection via region-based fully convolutional networks. In: Advances in neural information processing systems, pp 379\u2013387"},{"issue":"6","key":"10718_CR4","doi-asserted-by":"publisher","first-page":"1639","DOI":"10.1109\/TCSVT.2019.2906246","volume":"30","author":"K Duan","year":"2020","unstructured":"Duan K, Du D, Qi H, Huang Q (2020) Detecting small objects using a channel-aware deconvolutional network. IEEE Trans Circ Syst Video Technol 30(6):1639\u20131652","journal-title":"IEEE Trans Circ Syst Video Technol"},{"issue":"2","key":"10718_CR5","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1007\/s11263-009-0275-4","volume":"88","author":"M Everingham","year":"2010","unstructured":"Everingham M, Gool LV, Williams CKI, Winn J, Zisserman A (2010) The pascal visual object classes (voc) challenge. Int J Comput Vis 88 (2):303\u2013338","journal-title":"Int J Comput Vis"},{"key":"10718_CR6","unstructured":"Fu C, Liu W, Ranga A, Tyagi A, Berg AC (2017) DSSD : deconvolutional Single shot detector. In: IEEE conference on computer vision and pattern recognition. arXiv:1701.06659"},{"issue":"9","key":"10718_CR7","first-page":"1904","volume":"37","author":"R Girshick","year":"2013","unstructured":"Girshick R, Donahue J, Darrell T, Malik J, He K, Zhang X, Ren S, Sun J (2013) Rich feature hierarchies for accurate object detection and semantic segmentation. 
IEEE Trans Pattern Anal Machine Intell 37(9):1904\u20131916","journal-title":"IEEE Trans Pattern Anal Machine Intell"},{"key":"10718_CR8","doi-asserted-by":"crossref","unstructured":"Girshick R (2015) Fast r-cnn. In: Proceedings of the IEEE international conference on computer vision, pp 1440\u20131448","DOI":"10.1109\/ICCV.2015.169"},{"key":"10718_CR9","volume-title":"Advances in soft computing and machine learning in image processing","author":"AE Hassanien","year":"2017","unstructured":"Hassanien AE, Alberto OD (2017) Advances in soft computing and machine learning in image processing. Springer, Berlin"},{"issue":"9","key":"10718_CR10","doi-asserted-by":"publisher","first-page":"1904","DOI":"10.1109\/TPAMI.2015.2389824","volume":"37","author":"K He","year":"2015","unstructured":"He K, Zhang X, Ren S, Sun J (2015) Spatial pyramid pooling in deep convolutional networks for visual recognition. IEEE Trans Pattern Anal Machine Intell 37(9):1904\u20131916","journal-title":"IEEE Trans Pattern Anal Machine Intell"},{"key":"10718_CR11","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2016) Deep residual learning for image recognition. In: Computer vision and pattern recognition, pp 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"10718_CR12","unstructured":"Howard AG, Zhu M, Chen B, Kalenichenko D, Wang W, Weyand T, Andreetto M, Adam H (2017) Mobilenets: efficient convolutional neural networks for mobile vision applications. In: IEEE conference on computer vision and pattern recognition. arXiv:1704.04861"},{"key":"10718_CR13","doi-asserted-by":"crossref","unstructured":"Huang G, Liu Z, Maaten LVD, Weinberger KQ (2017) Densely connected convolutional networks. 
In: Computer vision and pattern recognition, pp 2261\u20132269","DOI":"10.1109\/CVPR.2017.243"},{"key":"10718_CR14","doi-asserted-by":"crossref","unstructured":"Ivanov Y, Peleshko D, Makoveychuk O, Izonin I, Malets I, Lotoshunska N, Batyuk D (2015) Adaptive moving object segmentation algorithms in cluttered environments. In: The experience of designing and application of CAD systems in microelectronics. IEEE, pp 97\u201399","DOI":"10.1109\/CADSM.2015.7230806"},{"key":"10718_CR15","doi-asserted-by":"crossref","unstructured":"Jeong J, Park H, Kwak N (2017) Enhancement of ssd by concatenating feature maps for object detection. In: IEEE conference on computer vision and pattern recognition. arXiv:1705.09587","DOI":"10.5244\/C.31.76"},{"key":"10718_CR16","doi-asserted-by":"crossref","unstructured":"Kim S, Kook HK, Sun JY, Kang MC, Ko S (2018) Parallel feature pyramid network for object detection. In: European conference on computer vision, pp 239\u2013256","DOI":"10.1007\/978-3-030-01228-1_15"},{"key":"10718_CR17","doi-asserted-by":"crossref","unstructured":"Kong T, Yao A, Chen Y, Sun F (2016) Hypernet: towards accurate region proposal generation and joint object detection. In: Computer vision and pattern recognition, pp 845\u2013853","DOI":"10.1109\/CVPR.2016.98"},{"key":"10718_CR18","doi-asserted-by":"crossref","unstructured":"Kong T, Sun F, Yao A, Liu H, Lu M, Chen Y (2017) Ron: reverse connection with objectness prior networks for object detection. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 5936\u20135944","DOI":"10.1109\/CVPR.2017.557"},{"issue":"6","key":"10718_CR19","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1145\/3065386","volume":"60","author":"A Krizhevsky","year":"2017","unstructured":"Krizhevsky A, Sutskever I, Hinton GE (2017) Imagenet classification with deep convolutional neural networks. 
Communications of The ACM 60(6):84\u201390","journal-title":"Communications of The ACM"},{"key":"10718_CR20","doi-asserted-by":"publisher","first-page":"1113","DOI":"10.1109\/TIP.2019.2936112","volume":"29","author":"Q Lai","year":"2019","unstructured":"Lai Q, Wang W, Sun H, Shen J (2019) Video saliency prediction using spatiotemporal residual attentive networks. IEEE Trans Image Process 29:1113\u20131126","journal-title":"IEEE Trans Image Process"},{"key":"10718_CR21","unstructured":"Li Z, Zhou F (2017) Fssd: feature fusion single shot multibox detector. In: IEEE conference on computer vision and pattern recognition. arXiv:1712.00960"},{"key":"10718_CR22","doi-asserted-by":"crossref","unstructured":"Li X, Wang W, Hu X, Yang J (2019) Selective kernel networks. In: Computer vision and pattern recognition, pp 510\u2013519","DOI":"10.1109\/CVPR.2019.00060"},{"key":"10718_CR23","doi-asserted-by":"crossref","unstructured":"Li Y, Pang Y, Shen J, Cao J, Shao L (2020) NETNet: neighbor erasing and transferring network for better single shot object detection. In: Computer vision and pattern recognition, pp 13349\u201313358","DOI":"10.1109\/CVPR42600.2020.01336"},{"key":"10718_CR24","doi-asserted-by":"crossref","unstructured":"Lin T, Dollar P, Girshick R, He K, Hariharan B, Belongie S (2017) Feature pyramid networks for object detection. In: Computer vision and pattern recognition, pp 936\u2013944","DOI":"10.1109\/CVPR.2017.106"},{"key":"10718_CR25","doi-asserted-by":"crossref","unstructured":"Lin TY, Goyal P, Girshick R, He K, Doll\u00e1r P (2017) Focal loss for dense object detection. In: Proceedings of the IEEE international conference on computer vision, pp. 2980\u20132988","DOI":"10.1109\/ICCV.2017.324"},{"key":"10718_CR26","doi-asserted-by":"crossref","unstructured":"Lin M, Ji R, Wang Y, Zhang Y, Zhang B, Tian Y, Ling S (2020) Hrank: filter pruning using high-rank feature map. 
In: Computer vision and pattern recognition (CVPR)","DOI":"10.1109\/CVPR42600.2020.00160"},{"key":"10718_CR27","doi-asserted-by":"crossref","unstructured":"Liu W, Anguelov D, Erhan D, Szegedy C, Reed S, Fu C, Berg AC (2016) SSD: single Shot multibox detector. In: European conference on computer vision, pp 21\u201337","DOI":"10.1007\/978-3-319-46448-0_2"},{"issue":"10","key":"10718_CR28","first-page":"1266","volume":"48","author":"YAO Qunli","year":"2019","unstructured":"Qunli YAO, Xian HU, Hong Lei (2019) Aircraft detection in remote sensing imagery with multi-scale feature fusion convolutional neural networks. Acta Geodaetica et Cartographica Sinica 48(10):1266\u20131274","journal-title":"Acta Geodaetica et Cartographica Sinica"},{"issue":"6","key":"10718_CR29","doi-asserted-by":"publisher","first-page":"1137","DOI":"10.1109\/TPAMI.2016.2577031","volume":"39","author":"S Ren","year":"2017","unstructured":"Ren S, He K, Girshick R, Sun J (2017) Faster r-cnn: towards real-time object detection with region proposal networks. IEEE Trans Pattern Anal Mach Intell 39(6):1137\u20131149","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"10718_CR30","doi-asserted-by":"crossref","unstructured":"Redmon J, Divvala SK, Girshick R, Farhadi A (2016) You only look once: unified, real-time object detection. In: Computer vision and pattern recognition, pp 779\u2013788","DOI":"10.1109\/CVPR.2016.91"},{"key":"10718_CR31","doi-asserted-by":"crossref","unstructured":"Redmon J, Farhadi A (2017) Yolo9000: better, faster, stronger. In: Computer vision and pattern recognition, pp 6517\u20136525","DOI":"10.1109\/CVPR.2017.690"},{"key":"10718_CR32","unstructured":"Redmon J, Farhadi A (2018) yolov3: an incremental improvement. In: IEEE conference on computer vision and pattern recognition. 
arXiv:1804.02767"},{"key":"10718_CR33","doi-asserted-by":"crossref","unstructured":"Shen Z, Liu Z, Li J, Jiang Y, Chen Y, Xue X (2017) Dsod: learning deeply supervised object detectors from scratch. In: International conference on computer vision, pp 1937\u20131945","DOI":"10.1109\/ICCV.2017.212"},{"issue":"7","key":"10718_CR34","doi-asserted-by":"publisher","first-page":"3068","DOI":"10.1109\/TCYB.2019.2936503","volume":"50","author":"J Shen","year":"2019","unstructured":"Shen J, Tang X, Dong X, Shao L (2019) Visual object tracking by hierarchical attention siamese network. IEEE Trans Cybern 50(7):3068\u20133080","journal-title":"IEEE Trans Cybern"},{"issue":"20","key":"10718_CR35","doi-asserted-by":"publisher","first-page":"4276","DOI":"10.3390\/app9204276","volume":"9","author":"W Shi","year":"2019","unstructured":"Shi W, Bao S, Tan D (2019) FFESSD: an accurate and efficient single-shot detector for target detection. Appl Sci 9(20):4276","journal-title":"Appl Sci"},{"key":"10718_CR36","unstructured":"Simonyan K, Zisserman A (2014) Very deep convolutional networks for large-scale image recognition. In: IEEE conference on computer vision and pattern recognition. arXiv:1409.1556"},{"key":"10718_CR37","doi-asserted-by":"crossref","unstructured":"Song H, Wang W, Zhao S, Shen J, Lam K-M (2018) Pyramid dilated deeper convlstm for video salient object detection. In: Proceedings of the European conference on computer vision (ECCV), pp 715\u2013731","DOI":"10.1007\/978-3-030-01252-6_44"},{"issue":"8","key":"10718_CR38","doi-asserted-by":"publisher","first-page":"2014","DOI":"10.1109\/TVCG.2016.2600594","volume":"23","author":"W Wang","year":"2016","unstructured":"Wang W, Shen J, Yu Y, Ma K-L (2016) Stereoscopic thumbnail creation via efficient stereo saliency detection. 
IEEE Trans Visualization Comput Graphic 23(8):2014\u20132027","journal-title":"IEEE Trans Visualization Comput Graphic"},{"key":"10718_CR39","doi-asserted-by":"crossref","unstructured":"Wang W, Shen J, Cheng M-M, Shao L (2019) An iterative and cooperative top-down and bottom-up inference network for salient object detection. In: Computer vision and pattern recognition, pp 5968\u20135977","DOI":"10.1109\/CVPR.2019.00612"},{"key":"10718_CR40","doi-asserted-by":"crossref","unstructured":"Wang W, Zhao S, Shen J, Hoi SCH, Borji A (2019) Salient object detection with pyramid attention and salient edges. In: Computer vision and pattern recognition, pp 1448\u20131457","DOI":"10.1109\/CVPR.2019.00154"},{"key":"10718_CR41","doi-asserted-by":"crossref","unstructured":"Zhou P, Ni B, Geng C, Hu J, Xu Y (2018) Scale-transferrable object detection. In: Computer vision and pattern recognition, pp 528\u2013537","DOI":"10.1109\/CVPR.2018.00062"},{"key":"10718_CR42","doi-asserted-by":"publisher","first-page":"104812","DOI":"10.1016\/j.ssci.2020.104812","volume":"130","author":"W Wang","year":"2020","unstructured":"Wang W, Shen J, Yu Y, Ma K-L (2020) Deep learning for autonomous ship-oriented small ship detection. Saf Sci 130:104812","journal-title":"Saf Sci"},{"issue":"5","key":"10718_CR43","doi-asserted-by":"publisher","first-page":"2368","DOI":"10.1109\/TIP.2017.2787612","volume":"27","author":"W Wang","year":"2017","unstructured":"Wang W, Shen J (2017) Deep visual attention prediction. IEEE Trans Image Process 27(5):2368\u20132378","journal-title":"IEEE Trans Image Process"},{"key":"10718_CR44","doi-asserted-by":"publisher","unstructured":"Wang W, Shen J, Xie J, Cheng M-M, Ling H, Borji A (2019) Revisiting Video Saliency Prediction in the Deep Learning Era. IEEE Transactions on Pattern Analysis and Machine Intelligence. 
https:\/\/doi.org\/10.1109\/TPAMI.2019.2924417","DOI":"10.1109\/TPAMI.2019.2924417"},{"issue":"7","key":"10718_CR45","doi-asserted-by":"publisher","first-page":"1531","DOI":"10.1109\/TPAMI.2018.2840724","volume":"41","author":"W Wang","year":"2018","unstructured":"Wang W, Shen J, Ling H (2018) A deep network solution for attention and aesthetics aware photo cropping. IEEE Trans Pattern Anal Mach Intell 41(7):1531\u20131544","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"10718_CR46","doi-asserted-by":"publisher","unstructured":"Wei H, Zhang Y, Wang B, Yang Y, Li H, Wang H (2020) X-linenet: detecting aircraft in remote sensing images by a pair of intersecting line segments. IEEE Transactions on Geoscience and Remote Sensing. https:\/\/doi.org\/10.1109\/TGRS.2020.2999082","DOI":"10.1109\/TGRS.2020.2999082"},{"key":"10718_CR47","doi-asserted-by":"crossref","unstructured":"Zhang S, Wen L, Bian X, Lei Z, Li SZ (2018) Single-shot refinement neural network for object detection. In: Computer vision and pattern recognition, pp 4203\u20134212","DOI":"10.1109\/CVPR.2018.00442"},{"key":"10718_CR48","doi-asserted-by":"crossref","unstructured":"Zhang Z, Qiao S, Xie C, Shen W, Wang B, Yuille AL (2018) Single-shot object detection with enriched semantics. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 5813\u20135821","DOI":"10.1109\/CVPR.2018.00609"},{"key":"10718_CR49","doi-asserted-by":"publisher","first-page":"2789","DOI":"10.1007\/s11063-020-10228-5","volume":"51","author":"H Zhao","year":"2020","unstructured":"Zhao H, Li Z, Fang L, Zhang T (2020) A balanced feature fusion SSD for object detection. Neural Process Lett 51:2789\u20132806. 
https:\/\/doi.org\/10.1007\/s11063-020-10228-5","journal-title":"Neural Process Lett"},{"key":"10718_CR50","doi-asserted-by":"crossref","unstructured":"Zhu H, Chen X, Dai W, Fu K, Ye Q, Jiao J (2015) Orientation robust object detection in aerial images using deep convolutional neural network. In: International conference on image processing, pp 3735\u20133739","DOI":"10.1109\/ICIP.2015.7351502"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-021-10718-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-021-10718-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-021-10718-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,5,21]],"date-time":"2021-05-21T06:17:42Z","timestamp":1621577862000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-021-10718-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,3,5]]},"references-count":50,"journal-issue":{"issue":"13","published-print":{"date-parts":[[2021,5]]}},"alternative-id":["10718"],"URL":"https:\/\/doi.org\/10.1007\/s11042-021-10718-1","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"value":"1380-7501","type":"print"},{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,3,5]]},"assertion":[{"value":"17 September 2020","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"23 November 2020","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"10 February 
2021","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"5 March 2021","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"<!--Emphasis Type='Bold' removed-->Conflict of Interests"}}]}}