{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:16:31Z","timestamp":1750220191832,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":32,"publisher":"ACM","license":[{"start":{"date-parts":[[2022,9,23]],"date-time":"2022-09-23T00:00:00Z","timestamp":1663891200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62072370"],"award-info":[{"award-number":["62072370"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2022,9,23]]},"DOI":"10.1145\/3573942.3574033","type":"proceedings-article","created":{"date-parts":[[2023,5,16]],"date-time":"2023-05-16T23:45:42Z","timestamp":1684280742000},"page":"353-359","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Object Detection Algorithm Based on Second-Order Pooling Network and Gaussian Mixture Attention"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-8588-8111","authenticated-orcid":false,"given":"Sugang","family":"Ma","sequence":"first","affiliation":[{"name":"School of Computer Science and Technology, Xi'an University of Posts and Telecommunications, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6110-5741","authenticated-orcid":false,"given":"Ningbo","family":"Li","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, Xi'an University of Posts and Telecommunications, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1515-8663","authenticated-orcid":false,"given":"Xiaobao","family":"Yang","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, Xi'an University of Posts and Telecommunications, China"}]}],"member":"320","published-online":{"date-parts":[[2023,5,16]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2022.3185402"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.comcom.2021.10.023"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2022.108796"},{"issue":"04","key":"e_1_3_2_1_4_1","first-page":"1201","article-title":"Deep learning for multi-scale object detection: A Survey[J]","volume":"32","author":"Chen Keqi","year":"2021","unstructured":"Chen Keqi, Zhu Zhiliang, Deng Xiaoming, Deep learning for multi-scale object detection: A Survey[J]. Journal of Software, 2021, 32(04):1201-1227","journal-title":"Journal of Software"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1023\/B:VISI.0000029664.99615.94"},{"key":"e_1_3_2_1_6_1","first-page":"886","article-title":"Histograms of oriented gradients for human detection[C]\/\/2005 IEEE computer society conference on computer vision and pattern recognition (CVPR'05)","volume":"1","author":"Dalal N","year":"2005","unstructured":"Dalal N, Triggs B. Histograms of oriented gradients for human detection[C]\/\/2005 IEEE computer society conference on computer vision and pattern recognition (CVPR'05). Ieee, 2005, 1: 886-893.","journal-title":"Ieee"},{"key":"e_1_3_2_1_7_1","volume-title":"Rich feature hierarchies for accurate object detection and semantic segmentation[C] \/\/Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition","author":"Girshick R","year":"2014","unstructured":"Girshick R, Donahue J, Darrell T, Rich feature hierarchies for accurate object detection and semantic segmentation[C] \/\/Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. Los Alamitos: IEEE Computer Society Press, 2014: 580-587"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2577031"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"crossref","unstructured":"Pang J Chen K Shi J Libra r-cnn: Towards balanced learning for object detection[C]\/\/Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. 2019: 821-830.","DOI":"10.1109\/CVPR.2019.00091"},{"key":"e_1_3_2_1_10_1","volume-title":"You only look once: Unified, real-time object detection[C] \/\/Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition","author":"Redmon J","year":"2016","unstructured":"Redmon J, Divvala S, Girshick R, You only look once: Unified, real-time object detection[C] \/\/Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. Los Alamitos: IEEE Computer Society Press, 2016: 779-788"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"crossref","unstructured":"Redmon J Farhadi A. YOLO9000: better faster stronger[C]\/\/Proceedings of the IEEE conference on computer vision and pattern recognition. 2017: 7263-7271.","DOI":"10.1109\/CVPR.2017.690"},{"key":"e_1_3_2_1_12_1","unstructured":"Redmon J Farhadi A. Yolov3: An incremental improvement[OL]. [2018.4.8]. https:\/\/arxiv.org\/abs\/1804.02767.pdf"},{"key":"e_1_3_2_1_13_1","volume-title":"Liao H Y M. Yolov4: Optimal speed and accuracy of object detection[J]. arXiv preprint arXiv:2004.10934","author":"Bochkovskiy A","year":"2020","unstructured":"Bochkovskiy A, Wang C Y, Liao H Y M. Yolov4: Optimal speed and accuracy of object detection[J]. arXiv preprint arXiv:2004.10934, 2020."},{"key":"e_1_3_2_1_14_1","volume-title":"Wang F","author":"Ge Z","year":"2021","unstructured":"Ge Z, Liu S, Wang F, Yolox: Exceeding yolo series in 2021[OL]. [2021.7.18]. https:\/\/arxiv.org\/abs\/2107.08430.pdf"},{"key":"e_1_3_2_1_15_1","volume-title":"Erhan D","author":"Liu W","year":"2016","unstructured":"Liu W, Anguelov D, Erhan D, SSD: Single shot multibox detector[C] \/\/ Proceedings of European Conference on Computer Vision. Heidelberg: Springer, 2016: 21-37"},{"key":"e_1_3_2_1_16_1","volume-title":"Chen H","author":"Tian Z","year":"2019","unstructured":"Tian Z, Shen C, Chen H, FCOS: Fully convolutional one-stage object detection[C] \/\/Proceedings of the IEEE International Conference on Computer Vision. Los Alamitos: IEEE Computer Society Press, 2019: 9627-9636"},{"key":"e_1_3_2_1_17_1","unstructured":"Zhou Xingyi Wang Dequan KR\u00c4HENB\u00dcHL P. Objects as points[OL]. [2019.5.25]. https:\/\/arxiv.org\/abs\/1904.07850.pdf"},{"key":"e_1_3_2_1_18_1","volume-title":"Advances in Neural Information Processing Systems","author":"Vaswani A","year":"2017","unstructured":"Vaswani A, Shazeer N, Parmar N, Attention is all you need[J]. Advances in Neural Information Processing Systems, 2017, 30"},{"key":"e_1_3_2_1_19_1","volume-title":"End-to-end object detection with transformers[C] \/\/ Proceedings of European Conference on Computer Vision","author":"Carion N","year":"2020","unstructured":"Carion N, Massa F, Synnaeve G, End-to-end object detection with transformers[C] \/\/ Proceedings of European Conference on Computer Vision. Heidelberg: Springer, 2020: 213-229"},{"key":"e_1_3_2_1_20_1","volume-title":"UP-DETR: Unsupervised pre-training for object detection with transformers[C] \/\/Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition","author":"Dai Z","year":"2021","unstructured":"Dai Z, Cai B, Lin Y, UP-DETR: Unsupervised pre-training for object detection with transformers[C] \/\/Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. Los Alamitos: IEEE Computer Society Press, 2021: 1601-1610"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"crossref","unstructured":"Wang H Wang Q Gao M Multi-scale location-aware kernel representation for object detection[C]\/\/Proceedings of the IEEE conference on computer vision and pattern recognition. 2018: 1248-1257.","DOI":"10.1109\/CVPR.2018.00136"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"crossref","unstructured":"Gao Z Xie J Wang Q Global second-order pooling convolutional networks[C]\/\/Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 2019: 3024-3033.","DOI":"10.1109\/CVPR.2019.00314"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"crossref","unstructured":"Chen B Deng W Hu J. Mixed high-order attention network for person re-identification[C]\/\/Proceedings of the IEEE\/CVF international conference on computer vision. 2019: 371-381.","DOI":"10.1109\/ICCV.2019.00046"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"crossref","unstructured":"Li P Xie J Wang Q Is second-order information helpful for large-scale visual recognition?[C]\/\/Proceedings of the IEEE international conference on computer vision. 2017: 2070-2078.","DOI":"10.1109\/ICCV.2017.228"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"crossref","unstructured":"Hu J Shen L Sun G. Squeeze-and-excitation networks[C]\/\/Proceedings of the IEEE conference on computer vision and pattern recognition. 2018: 7132-7141.","DOI":"10.1109\/CVPR.2018.00745"},{"key":"e_1_3_2_1_26_1","volume-title":"Lee J Y","author":"Woo S","year":"2018","unstructured":"Woo S, Park J, Lee J Y, Cbam: Convolutional block attention module[C]\/\/Proceedings of the European conference on computer vision (ECCV). 2018: 3-19."},{"key":"e_1_3_2_1_27_1","volume-title":"Lee J Y","author":"Park J","year":"2018","unstructured":"Park J, Woo S, Lee J Y, BAM: Bottleneck Attention Module[C]\/\/British Machine Vision Conference (BMVC). British Machine Vision Association (BMVA), 2018."},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"crossref","unstructured":"Hou Q Zhou D Feng J. Coordinate attention for efficient mobile network design[C]\/\/Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. 2021: 13713-13722.","DOI":"10.1109\/CVPR46437.2021.01350"},{"volume-title":"IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 2021: 15129-15138","author":"Ruan D","key":"e_1_3_2_1_29_1","unstructured":"Ruan D, Wang D, Zheng Y, Gaussian Context Transformer[C]\/\/Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 2021: 15129-15138."},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.5555\/3157096.3157139"},{"key":"e_1_3_2_1_31_1","first-page":"2980","volume-title":"2017 IEEE International Conference on Computer Vision","year":"2017","unstructured":"LIN T Y, GOYAL P, GIRSHICK R, Focal loss for dense object detection[C]. 2017 IEEE International Conference on Computer Vision, Venice, Italy, 2017: 2980-2988."},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"crossref","unstructured":"Zhou X Zhuo J Krahenbuhl P. Bottom-up object detection by grouping extreme and center points[C]\/\/Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. 2019: 850-859.","DOI":"10.1109\/CVPR.2019.00094"}],"event":{"name":"AIPR 2022: 2022 5th International Conference on Artificial Intelligence and Pattern Recognition","acronym":"AIPR 2022","location":"Xiamen China"},"container-title":["Proceedings of the 2022 5th International Conference on Artificial Intelligence and Pattern Recognition"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3573942.3574033","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3573942.3574033","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T19:02:32Z","timestamp":1750186952000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3573942.3574033"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,9,23]]},"references-count":32,"alternative-id":["10.1145\/3573942.3574033","10.1145\/3573942"],"URL":"https:\/\/doi.org\/10.1145\/3573942.3574033","relation":{},"subject":[],"published":{"date-parts":[[2022,9,23]]},"assertion":[{"value":"2023-05-16","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}