{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,24]],"date-time":"2025-12-24T18:07:48Z","timestamp":1766599668664,"version":"3.37.3"},"reference-count":43,"publisher":"Springer Science and Business Media LLC","issue":"9","license":[{"start":{"date-parts":[[2022,3,3]],"date-time":"2022-03-03T00:00:00Z","timestamp":1646265600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,3,3]],"date-time":"2022-03-03T00:00:00Z","timestamp":1646265600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100004663","name":"Ministry of Science and Technology, Taiwan","doi-asserted-by":"publisher","award":["109-2637-E-167 -004 -"],"award-info":[{"award-number":["109-2637-E-167 -004 -"]}],"id":[{"id":"10.13039\/501100004663","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2022,4]]},"DOI":"10.1007\/s11042-021-11897-7","type":"journal-article","created":{"date-parts":[[2022,3,3]],"date-time":"2022-03-03T05:03:49Z","timestamp":1646283829000},"page":"11917-11929","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Multi-fusion feature pyramid for real-time hand detection"],"prefix":"10.1007","volume":"81","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-5010-2767","authenticated-orcid":false,"given":"Chuan-Wang","family":"Chang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Santanu","family":"Santra","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jun-Wei","family":"Hsieh","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Pirdiansyah","family":"Hendri","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chi-Fang","family":"Lin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2022,3,3]]},"reference":[{"key":"11897_CR1","doi-asserted-by":"publisher","first-page":"1949","DOI":"10.1109\/ICCV.2015.226","volume-title":"2015 IEEE International Conference on Computer Vision (ICCV)","author":"S Bambach","year":"2015","unstructured":"Bambach S, Lee S, Crandall DJ, Yu C (2015) Lending A Hand: Detecting Hands and Recognizing Activities in Complex Egocentric Interactions. In: 2015 IEEE International Conference on Computer Vision (ICCV), pp 1949\u20131957"},{"key":"11897_CR2","volume-title":"YOLOv4: optimal speed and accuracy of object detection","author":"A Bochkovskiy","year":"2020","unstructured":"A. Bochkovskiy, C.-Y. Wang, and H.-Y. M. Liao, \u201cYOLOv4: optimal speed and accuracy of object detection,\u201d 2020."},{"key":"11897_CR3","first-page":"1","volume-title":"Br. Mach. Vis. Conf. 2018, BMVC 2018","author":"B Bosquet","year":"2019","unstructured":"Bosquet B, Mucientes M, Brea VM (2019) StDNet: A convnet for small target detection. In: Br. Mach. Vis. Conf. 2018, BMVC 2018, pp 1\u201312"},{"issue":"8","key":"11897_CR4","doi-asserted-by":"publisher","first-page":"1562","DOI":"10.1109\/TIM.2008.922070","volume":"57","author":"Q Chen","year":"2008","unstructured":"Chen Q, Georganas ND, Petriu EM (2008) Hand gesture recognition using Haar-like features and a stochastic context-free grammar. IEEE Trans Instrum Meas 57(8):1562\u20131571","journal-title":"IEEE Trans Instrum Meas"},{"issue":"3","key":"11897_CR5","doi-asserted-by":"publisher","first-page":"403","DOI":"10.1109\/THMS.2015.2492598","volume":"46","author":"MY Chen","year":"2016","unstructured":"Chen MY, Alregib G, Juang B-H (2016) Air-writing recognition-part I: modeling and recognition of characters, words, and connecting motions. IEEE Trans on Human-Machine Systems 46(3):403\u2013413","journal-title":"IEEE Trans on Human-Machine Systems"},{"issue":"3","key":"11897_CR6","doi-asserted-by":"publisher","first-page":"403","DOI":"10.1109\/THMS.2015.2492598","volume":"46","author":"M Chen","year":"2016","unstructured":"Chen M, AlRegib G, Juang BH (2016) Air-writing recognition - part I: modeling and recognition of characters, words, and connecting motions. IEEE Trans Human-Machine Syst 46(3):403\u2013413","journal-title":"IEEE Trans Human-Machine Syst"},{"issue":"11","key":"11897_CR7","doi-asserted-by":"publisher","first-page":"3592","DOI":"10.1109\/TIM.2011.2161140","volume":"60","author":"NH Dardas","year":"2011","unstructured":"Dardas NH, Georganas ND (2011) Real-time hand gesture detection and recognition using bag-of-features and support vector machine techniques. IEEE Trans Instrum Meas 60(11):3592\u20133607","journal-title":"IEEE Trans Instrum Meas"},{"issue":"4","key":"11897_CR8","doi-asserted-by":"publisher","first-page":"1888","DOI":"10.1109\/TIP.2017.2779600","volume":"27","author":"X Deng","year":"2018","unstructured":"Deng X, Zhang Y, Yang S, Tan P, Chang L, Yuan Y, Wang H (2018) Joint hand detection and rotation estimation using CNN. IEEE Trans Image Process 27(4):1888\u20131900","journal-title":"IEEE Trans Image Process"},{"issue":"9","key":"11897_CR9","doi-asserted-by":"publisher","first-page":"1627","DOI":"10.1109\/TPAMI.2009.167","volume":"32","author":"PF Felzenszwalb","year":"2010","unstructured":"Felzenszwalb PF, Girshick RB, McAllester D, Ramanan D (2010) Object detection with discriminatively trained part-based models. IEEE Trans Pattern Anal Mach Intell 32(9):1627\u20131645","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"11897_CR10","doi-asserted-by":"publisher","first-page":"580","DOI":"10.1109\/CVPR.2014.81","volume-title":"2014 IEEE Conference on Computer Vision and Pattern Recognition","author":"R Girshick","year":"2014","unstructured":"Girshick R, Donahue J, Darrell T, Malik J (2014) Rich Feature Hierarchies for Accurate Object Detection and Semantic Segmentation. In: 2014 IEEE Conference on Computer Vision and Pattern Recognition, pp 580\u2013587"},{"key":"11897_CR11","doi-asserted-by":"crossref","unstructured":"Gupta L, Ma S (2001) Gesture-based interaction and communication: automated classification of hand gesture contours. IEEE Trans. Syst. Man, Cybern. Part C Applications Rev, 31(1):114\u2013120","DOI":"10.1109\/5326.923274"},{"issue":"5","key":"11897_CR12","doi-asserted-by":"publisher","first-page":"1318","DOI":"10.1109\/TCYB.2013.2265378","volume":"43","author":"J Han","year":"2013","unstructured":"Han J, Shao L, Xu D, Shotton J (2013) Enhanced computer vision with Microsoft Kinect sensor: a review. IEEE Trans Cybern 43(5):1318\u20131334","journal-title":"IEEE Trans Cybern"},{"issue":"9","key":"11897_CR13","doi-asserted-by":"publisher","first-page":"1904","DOI":"10.1109\/TPAMI.2015.2389824","volume":"37","author":"K He","year":"2015","unstructured":"He K, Zhang X, Ren S, Sun J (2015) Spatial pyramid pooling in deep convolutional networks for visual recognition. IEEE Trans Pattern Anal Mach Intell 37(9):1904\u20131916","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"11897_CR14","doi-asserted-by":"crossref","unstructured":"K. He, G. Gkioxari, P. Dollar, and R. Girshick, \u201cMask R-CNN,\u201d 2017, pp. 2980\u20132988.","DOI":"10.1109\/ICCV.2017.322"},{"issue":"5","key":"11897_CR15","doi-asserted-by":"publisher","first-page":"1034","DOI":"10.1109\/TSMCC.2007.900624","volume":"37","author":"I Infantino","year":"2007","unstructured":"Infantino I, Rizzo R, Gaglio S (2007) A framework for sign language sentence recognition by commonsense context. IEEE Trans. Syst. Man, Cybern. Part C Applications Rev. 37(5):1034\u20131039","journal-title":"IEEE Trans. Syst. Man, Cybern. Part C Applications Rev."},{"key":"11897_CR16","doi-asserted-by":"crossref","unstructured":"S.-W. Kim, H.-K. Kook, J.-Y. Sun, M.-C. Kang, and S.-J. Ko, \u201cParallel Feature Pyramid Network for Object Detection: 15th European Conference, Munich, Germany, September 8\u201314, 2018, Proceedings, Part V,\u201d 2018, pp. 239\u2013256.","DOI":"10.1007\/978-3-030-01228-1_15"},{"key":"11897_CR17","doi-asserted-by":"publisher","first-page":"614","DOI":"10.1109\/AFGR.2004.1301601","volume-title":"Sixth IEEE International Conference on Automatic Face and Gesture Recognition, 2004","author":"M Kolsch","year":"2004","unstructured":"Kolsch M, Turk M (2004) Robust hand detection. In: Sixth IEEE International Conference on Automatic Face and Gesture Recognition, 2004. Proceedings, pp 614\u2013619"},{"key":"11897_CR18","doi-asserted-by":"crossref","unstructured":"Law H, Deng J (2019) CornerNet: detecting objects as paired Keypoints. Int. J. Comput. Vis","DOI":"10.1007\/s11263-019-01204-1"},{"key":"11897_CR19","first-page":"1203","volume-title":"IEEE Comput. Soc. Conf. Comput. Vis. Pattern Recognit. Work., vol. 2017-July","author":"THN Le","year":"2017","unstructured":"Le THN, Quach KG, Zhu C, Duong CN, Luu K, Savvides M (2017) Robust Hand Detection and Classification in Vehicles and in the Wild. In: IEEE Comput. Soc. Conf. Comput. Vis. Pattern Recognit. Work., vol. 2017-July, pp 1203\u20131210"},{"issue":"12","key":"11897_CR20","doi-asserted-by":"publisher","first-page":"4696","DOI":"10.1109\/JSEN.2019.2901259","volume":"19","author":"TH Le","year":"2019","unstructured":"Le TH, Huang SC, Jaw DW (2019) Cross-resolution feature fusion for fast hand detection in intelligent homecare systems. IEEE Sensors J 19(12):4696\u20134704","journal-title":"IEEE Sensors J"},{"key":"11897_CR21","volume-title":"Microsoft COCO: common objects in context","author":"T-Y Lin","year":"2014","unstructured":"Lin T-Y et al (2014) Microsoft COCO: common objects in context"},{"key":"11897_CR22","doi-asserted-by":"publisher","first-page":"936","DOI":"10.1109\/CVPR.2017.106","volume-title":"2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"T Lin","year":"2017","unstructured":"Lin T, Doll\u00e1r P, Girshick R, He K, Hariharan B, Belongie S (2017) Feature Pyramid Networks for Object Detection. In: 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp 936\u2013944"},{"key":"11897_CR23","first-page":"2999","volume-title":"Proc. IEEE Int. Conf. Comput. Vis., vol. 2017-Octob","author":"TY Lin","year":"2017","unstructured":"Lin TY, Goyal P, Girshick R, He K, Dollar P (2017) Focal Loss for Dense Object Detection. In: Proc. IEEE Int. Conf. Comput. Vis., vol. 2017-Octob, pp 2999\u20133007"},{"key":"11897_CR24","first-page":"21","volume-title":"Lect. Notes Comput. Sci. (including Subser. Lect. Notes Artif. Intell. Lect. Notes Bioinformatics), vol. 9905 LNCS","author":"W Liu","year":"2016","unstructured":"Liu W et al (2016) SSD: Single shot multibox detector. In: Lect. Notes Comput. Sci. (including Subser. Lect. Notes Artif. Intell. Lect. Notes Bioinformatics), vol. 9905 LNCS, pp 21\u201337"},{"key":"11897_CR25","doi-asserted-by":"crossref","unstructured":"Lun R, Zhao W (2015) A Survey of Applications and Human Motion Recognition with Microsoft Kinect. 29(5)","DOI":"10.1142\/S0218001415550083"},{"key":"11897_CR26","doi-asserted-by":"crossref","unstructured":"Mei K, Xu L, Li B, Lin B, Wang F (2015) A Real-time Hand Detection System Based on Multi-feature. Neurocomputing 158","DOI":"10.1016\/j.neucom.2015.01.049"},{"issue":"3","key":"11897_CR27","doi-asserted-by":"publisher","first-page":"311","DOI":"10.1109\/TSMCC.2007.893280","volume":"37","author":"S Mitra","year":"2007","unstructured":"Mitra S, Acharya T (2007) Gesture recognition: a survey. IEEE Trans Syst Man, Cybern Part C Applications Rev 37(3):311\u2013324","journal-title":"IEEE Trans Syst Man, Cybern Part C Applications Rev"},{"key":"11897_CR28","doi-asserted-by":"crossref","unstructured":"A. Mittal, A. Zisserman, and P. Torr, \u201cHand detection using multiple proposals,\u201d pp. 75.1\u201375.11, 2011.","DOI":"10.5244\/C.25.75"},{"key":"11897_CR29","first-page":"93","volume-title":"Proc. ofInternational Conf. Comput. Vis. Image Process. Adv. Intell. Syst. Comput., vol. 460 AISC","author":"A Mohanty","year":"2017","unstructured":"Mohanty A, Ahmed A, Goswami T, Das A, Vaishnavi P, Sahay RR (2017) Robust Pose Recognition Using Deep Learning. In: Proc. ofInternational Conf. Comput. Vis. Image Process. Adv. Intell. Syst. Comput., vol. 460 AISC, pp 93\u2013105"},{"key":"11897_CR30","volume-title":"A boosted classifier tree for hand shape detection","author":"E-J Ong","year":"2004","unstructured":"E.-J. Ong and R. Bowden, \u201cA boosted classifier tree for hand shape detection,\u201d 2004."},{"key":"11897_CR31","first-page":"6517","volume-title":"Proc. - 30th IEEE Conf. Comput. Vis. Pattern Recognition, CVPR 2017, vol. 2017-Janua","author":"J Redmon","year":"2017","unstructured":"Redmon J, Farhadi A (2017) YOLO9000: Better, faster, stronger. In: Proc. - 30th IEEE Conf. Comput. Vis. Pattern Recognition, CVPR 2017, vol. 2017-Janua, pp 6517\u20136525"},{"key":"11897_CR32","unstructured":"J. Redmon and A. Farhadi, \u201cYOLOv3: An Incremental Improvement,\u201d 2018."},{"key":"11897_CR33","first-page":"779","volume-title":"Proc. IEEE Comput. Soc. Conf. Comput. Vis. Pattern Recognit., vol. 2016-Decem","author":"J Redmon","year":"2016","unstructured":"Redmon J, Divvala S, Girshick R, Farhadi A (2016) You only look once: Unified, real-time object detection. In: Proc. IEEE Comput. Soc. Conf. Comput. Vis. Pattern Recognit., vol. 2016-Decem, pp 779\u2013788"},{"issue":"6","key":"11897_CR34","doi-asserted-by":"publisher","first-page":"1137","DOI":"10.1109\/TPAMI.2016.2577031","volume":"39","author":"S Ren","year":"2017","unstructured":"Ren S, He K, Girshick R, Sun J (2017) Faster R-CNN: towards real-time object detection with region proposal networks. IEEE Trans Pattern Anal Mach Intell 39(6):1137\u20131149","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"11897_CR35","first-page":"640","volume-title":"Proc. - 2017 IEEE Int. Conf. Comput. Vis. Work. ICCVW 2017, vol. 2018-Janua","author":"K Roy","year":"2018","unstructured":"Roy K, Mohanty A, Sahay RR (2018) Deep Learning Based Hand Detection in Cluttered Environment Using Skin Segmentation. In: Proc. - 2017 IEEE Int. Conf. Comput. Vis. Work. ICCVW 2017, vol. 2018-Janua, pp 640\u2013649"},{"key":"11897_CR36","first-page":"1","volume-title":"3rd Int. Conf. Learn. Represent. ICLR 2015 - Conf. Track Proc","author":"K Simonyan","year":"2015","unstructured":"Simonyan K, Zisserman A (2015) Very deep convolutional networks for large-scale image recognition. In: 3rd Int. Conf. Learn. Represent. ICLR 2015 - Conf. Track Proc, pp 1\u201314"},{"key":"11897_CR37","volume-title":"Ubi-Media 2017 - Proc. 10th Int. Conf. Ubi-Media Comput. Work. with 4th Int. Work. Adv. E-Learning 1st Int. Work. Multimed. IoT Networks, Syst. Appl","author":"TH Tsai","year":"2017","unstructured":"Tsai TH, Hsieh JW, Chen HC, Huang SC (2017) Reverse time ordered stroke context for air-writing recognition. In: Ubi-Media 2017 - Proc. 10th Int. Conf. Ubi-Media Comput. Work. with 4th Int. Work. Adv. E-Learning 1st Int. Work. Multimed. IoT Networks, Syst. Appl"},{"key":"11897_CR38","unstructured":"R. Wang, X. Li, S. Ao, and C. Ling, \u201cPelee: a real-time object detection system on Mobile devices,\u201d 2018."},{"key":"11897_CR39","first-page":"400","volume-title":"Proc. IEEE Comput. Soc. Conf. Comput. Vis. Pattern Recognit., vol. 07\u201312-June, no. c","author":"Y Yang","year":"2015","unstructured":"Yang Y, Ferm\u00fcller C, Li Y, Aloimonos Y (2015) Grasp type revisited: A modern perspective on a classical feature for vision. In: Proc. IEEE Comput. Soc. Conf. Comput. Vis. Pattern Recognit., vol. 07\u201312-June, no. c, pp 400\u2013408"},{"issue":"6","key":"11897_CR40","doi-asserted-by":"publisher","first-page":"1064","DOI":"10.1109\/TSMCA.2011.2116004","volume":"41","author":"X Zhang","year":"2011","unstructured":"Zhang X, Chen X, Li Y, Lantz V, Wang K, Yang J (2011) A framework for hand gesture recognition based on accelerometer and EMG sensors. IEEE Trans Syst Man, Cybern - Part A Syst Humans 41(6):1064\u20131076","journal-title":"IEEE Trans Syst Man, Cybern - Part A Syst Humans"},{"issue":"4","key":"11897_CR41","doi-asserted-by":"publisher","first-page":"85","DOI":"10.1109\/MMUL.2013.50","volume":"20","author":"X Zhang","year":"2013","unstructured":"Zhang X, Ye Z, Jin L, Feng Z, Xu S (2013) A new writing experience: finger writing in the air using a kinect sensor. IEEE Multimed 20(4):85\u201393","journal-title":"IEEE Multimed"},{"key":"11897_CR42","first-page":"192","volume-title":"2015 IEEE 14th International Conference on Cognitive Informatics Cognitive Computing (ICCI*CC)","author":"L Zhang","year":"2015","unstructured":"Zhang L, Wu X, Luo D (2015) Human activity recognition with HMM-DNN model. In: 2015 IEEE 14th International Conference on Cognitive Informatics Cognitive Computing (ICCI*CC), pp 192\u2013197"},{"key":"11897_CR43","first-page":"9259","volume":"33","author":"Q Zhao","year":"2019","unstructured":"Zhao Q et al (2019) M2Det: a single-shot object detector based on multi-level feature pyramid network. Proc AAAI Conf Artif Intell 33:9259\u20139266","journal-title":"Proc AAAI Conf Artif Intell"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-021-11897-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-021-11897-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-021-11897-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,4,13]],"date-time":"2022-04-13T20:01:56Z","timestamp":1649880116000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-021-11897-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,3,3]]},"references-count":43,"journal-issue":{"issue":"9","published-print":{"date-parts":[[2022,4]]}},"alternative-id":["11897"],"URL":"https:\/\/doi.org\/10.1007\/s11042-021-11897-7","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"type":"print","value":"1380-7501"},{"type":"electronic","value":"1573-7721"}],"subject":[],"published":{"date-parts":[[2022,3,3]]},"assertion":[{"value":"31 March 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 October 2021","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"23 December 2021","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 March 2022","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}