{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,21]],"date-time":"2026-03-21T08:18:55Z","timestamp":1774081135956,"version":"3.50.1"},"reference-count":153,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2021,4,1]],"date-time":"2021-04-01T00:00:00Z","timestamp":1617235200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2021,4,1]],"date-time":"2021-04-01T00:00:00Z","timestamp":1617235200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"}],"funder":[{"DOI":"10.13039\/501100000780","name":"European Commission","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100000780","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Information Fusion"],"published-print":{"date-parts":[[2021,4]]},"DOI":"10.1016\/j.inffus.2020.11.002","type":"journal-article","created":{"date-parts":[[2020,11,19]],"date-time":"2020-11-19T22:36:13Z","timestamp":1605825373000},"page":"161-191","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":233,"special_numbering":"C","title":["Point-cloud based 3D object detection and classification methods for self-driving applications: A survey and taxonomy"],"prefix":"10.1016","volume":"68","author":[{"given":"Duarte","family":"Fernandes","sequence":"first","affiliation":[]},{"given":"Ant\u00f3nio","family":"Silva","sequence":"additional","affiliation":[]},{"given":"Rafael","family":"N\u00e9voa","sequence":"additional","affiliation":[]},{"given":"Cl\u00e1udia","family":"Sim\u00f5es","sequence":"additional","affiliation":[]},{"given":"Dibet","family":"Gonzalez","sequence":"additional","affiliation":[]},{"given":"Miguel","family":"Guevara","sequence":"additional","affiliation":[]},{"given":"Paulo","family":"Novais","sequence":"additional","affiliation":[]},{"given":"Jo\u00e3o","family":"Monteiro","sequence":"additional","affiliation":[]},{"given":"Pedro","family":"Melo-Pinto","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/j.inffus.2020.11.002_bib0001","article-title":"Global status report on road safety","author":"Ghebreyesus","year":"2018","journal-title":"Geneva"},{"issue":"5","key":"10.1016\/j.inffus.2020.11.002_bib0002","doi-asserted-by":"crossref","first-page":"327","DOI":"10.1093\/inthealth\/ihz042","article-title":"Looking back on 10 years of global road safety","volume":"11","author":"Peden","year":"2019","journal-title":"Int. Health"},{"issue":"2","key":"10.1016\/j.inffus.2020.11.002_bib0003","doi-asserted-by":"crossref","first-page":"315","DOI":"10.1111\/risa.13116","article-title":"How safe is safe enough for self-driving vehicles?","volume":"39","author":"Liu","year":"2019","journal-title":"Risk Anal."},{"issue":"9","key":"10.1016\/j.inffus.2020.11.002_bib0004","doi-asserted-by":"crossref","first-page":"e390","DOI":"10.1016\/S2542-5196(19)30170-6","article-title":"The global macroeconomic burden of road injuries: estimates and projections for 166 countries","volume":"3","author":"Chen","year":"2019","journal-title":"Lancet Planet. Heal."},{"key":"10.1016\/j.inffus.2020.11.002_bib0005","unstructured":"T.Litman, \u201cAutonomous vehicle implementation predictions implications for transport planning,\u201d Victoria, Canada, 2020. [Online]. Available: https:\/\/www.vtpi.org\/avip.pdf."},{"key":"10.1016\/j.inffus.2020.11.002_bib0006","doi-asserted-by":"crossref","unstructured":"Society of Automotive Engineers, \u201cSAE Standards News: J3016 automated-driving graphic update,\u201d United States, 2019. doi: https:\/\/doi.org\/10.4271\/J3016_201806.","DOI":"10.4271\/J3016_201806"},{"key":"10.1016\/j.inffus.2020.11.002_bib0007","doi-asserted-by":"crossref","first-page":"323","DOI":"10.1016\/j.arcontrol.2017.09.012","article-title":"Perception, information processing and modeling: Critical stages for autonomous driving applications","volume":"44","author":"Gruyer","year":"2017","journal-title":"Annu. Rev. Control"},{"key":"10.1016\/j.inffus.2020.11.002_bib0008","doi-asserted-by":"crossref","DOI":"10.1016\/j.trc.2018.02.012","article-title":"Autonomous vehicle perception: The technology of today and tomorrow","volume":"89","author":"Van Brummelen","year":"2018","journal-title":"Transp. Res. Part C Emerg. Technol."},{"issue":"1","key":"10.1016\/j.inffus.2020.11.002_bib0009","doi-asserted-by":"crossref","first-page":"6","DOI":"10.3390\/machines5010006","article-title":"Perception, planning, control, and coordination for autonomous vehicles","volume":"5","author":"Pendleton","year":"2017","journal-title":"Machines"},{"key":"10.1016\/j.inffus.2020.11.002_bib0010","article-title":"PointRCNN: 3D object proposal generation and detection from point cloud","author":"Shi","year":"2018","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0011","series-title":"Proc. IEEE Int. Conf. Comput. Vis.","first-page":"1440","article-title":"Fast R-CNN","author":"Girshick","year":"2015"},{"issue":"6","key":"10.1016\/j.inffus.2020.11.002_bib0012","doi-asserted-by":"crossref","first-page":"1137","DOI":"10.1109\/TPAMI.2016.2577031","article-title":"Faster R-CNN: towards real-time object detection with region proposal networks","volume":"39","author":"Ren","year":"2017","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"10","key":"10.1016\/j.inffus.2020.11.002_bib0013","doi-asserted-by":"crossref","first-page":"3782","DOI":"10.1109\/TITS.2019.2892405","article-title":"A survey on 3D object detection methods for autonomous driving applications","volume":"20","author":"Arnold","year":"2019","journal-title":"IEEE Trans. Intell. Transp. Syst."},{"key":"10.1016\/j.inffus.2020.11.002_bib0014","series-title":"ESSCIRC 2006 - Proc. 32nd Eur. Solid-State Circuits Conf.","first-page":"568","article-title":"A 64\u00d78 Pixel 3-D CMOS time of flight image sensor for car safety applications","author":"Elkhalili","year":"2006"},{"issue":"3","key":"10.1016\/j.inffus.2020.11.002_bib0015","doi-asserted-by":"crossref","first-page":"128837","DOI":"10.1109\/ACCESS.2019.2939201","article-title":"A survey of deep learning-based object detection","volume":"7","author":"Jiao","year":"2019","journal-title":"IEEE Access"},{"key":"10.1016\/j.inffus.2020.11.002_bib0016","article-title":"Deep learning for 3D point clouds: a survey","author":"Guo","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"issue":"19","key":"10.1016\/j.inffus.2020.11.002_bib0017","doi-asserted-by":"crossref","first-page":"4188","DOI":"10.3390\/s19194188","article-title":"Deep learning on point clouds and its application: a survey","volume":"19","author":"Liu","year":"2019","journal-title":"Sensors"},{"key":"10.1016\/j.inffus.2020.11.002_bib0018","article-title":"A review on deep learning techniques for 3D sensed data classification","author":"Griffiths","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"issue":"2","key":"10.1016\/j.inffus.2020.11.002_bib0019","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3042064","article-title":"Deep learning advances in computer vision with 3D data","volume":"50","author":"Ioannidou","year":"2017","journal-title":"ACM Comput. Surv."},{"key":"10.1016\/j.inffus.2020.11.002_bib0020","doi-asserted-by":"crossref","first-page":"2947","DOI":"10.1109\/TIP.2019.2955239","article-title":"Recent advances in 3D object detection in the era of deep neural networks: a survey","volume":"29","author":"Rahman","year":"2020","journal-title":"IEEE Trans. Image Process."},{"key":"10.1016\/j.inffus.2020.11.002_bib0021","article-title":"Recent advances in deep learning for object detection","author":"Wu","year":"2019","journal-title":"Neurocomputing"},{"key":"10.1016\/j.inffus.2020.11.002_bib0022","article-title":"Recent advances in convolutional neural networks","author":"Gu","year":"2015","journal-title":"Comput. Vis. Pattern"},{"key":"10.1016\/j.inffus.2020.11.002_bib0023","doi-asserted-by":"crossref","first-page":"634","DOI":"10.1007\/978-3-319-10599-4_41","article-title":"Sliding shapes for 3D object detection in depth images","author":"Song","year":"2014","journal-title":"Computer Vision \u2013 ECCV 2014"},{"key":"10.1016\/j.inffus.2020.11.002_bib0024","doi-asserted-by":"crossref","unstructured":"M.Engelcke, D.Rao, D. Z.Wang, C. H.Tong, and I.Posner, \u201cVote3deep: fast object detection in 3D point clouds using efficient convolutional neural networks,\u201d 2017.","DOI":"10.1109\/ICRA.2017.7989161"},{"key":"10.1016\/j.inffus.2020.11.002_bib0025","first-page":"4490","article-title":"VoxelNet: end-to-end learning for point cloud based 3D object detection","author":"Zhou","year":"2018","journal-title":"Proc. IEEE Comput. Soc. Conf. Comput. Vis. Pattern Recognit."},{"issue":"7","key":"10.1016\/j.inffus.2020.11.002_bib0026","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1115\/1.4043222","article-title":"Multimodal fusion object detection system for autonomous vehicles","volume":"141","author":"Person","year":"2019","journal-title":"J. Dyn. Syst. Meas. Control. Trans. ASME"},{"key":"10.1016\/j.inffus.2020.11.002_bib0027","first-page":"1","article-title":"Class-balanced grouping and sampling for point cloud 3D object detection","author":"Zhu","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0028","article-title":"3D fully convolutional network for vehicle detection in point cloud","author":"Li","year":"2016","journal-title":"Comput. Vis. Pattern Recognit."},{"issue":"10","key":"10.1016\/j.inffus.2020.11.002_bib0029","doi-asserted-by":"crossref","first-page":"1","DOI":"10.3390\/s18103337","article-title":"Second: Sparsely embedded convolutional detection","volume":"18","author":"Yan","year":"2018","journal-title":"Sensors (Switzerland)"},{"key":"10.1016\/j.inffus.2020.11.002_bib0030","article-title":"Patch refinement \u2013 localized 3D object detection","author":"Lehner","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0031","article-title":"Fast point R-CNN","author":"Chen","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0032","article-title":"Voxel-FPN: multi-scale voxel feature aggregation in 3D object detection from point clouds","author":"Wang","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0033","article-title":"PV-RCNN: point-voxel feature set abstraction for 3D object detection","author":"Shi","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0034","article-title":"Three-dimensional backbone network for 3D object detection in traffic scenes","author":"Li","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0035","doi-asserted-by":"crossref","DOI":"10.1016\/j.scs.2019.102002","article-title":"3D object detection based on sparse convolution neural network and feature fusion for autonomous driving in smart cities","volume":"54","author":"Wang","year":"2020","journal-title":"Sustain. Cities Soc."},{"key":"10.1016\/j.inffus.2020.11.002_bib0036","article-title":"From points to parts: 3D object detection from point cloud with part-aware and part-aggregation network","author":"Shi","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0037","unstructured":"C. R.Qi, H.Su, K.Mo, and L. J.Guibas, \u201cPointNet: deep learning on point sets for 3D classification and segmentation,\u201d 2017."},{"key":"10.1016\/j.inffus.2020.11.002_bib0038","first-page":"5099","article-title":"Pointnet++: Deep hierarchical feature learning on point sets in a metric space","author":"Qi","year":"2017","journal-title":"Adv. Neur. Inform. Process. Syst."},{"key":"10.1016\/j.inffus.2020.11.002_bib0039","article-title":"IPOD: intensive point-based object detector for point cloud","author":"Yang","year":"2018","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0040","article-title":"STD: sparse-to-dense 3D object detector for point cloud","author":"Yang","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0041","article-title":"PointRGCN: graph convolution networks for 3D vehicles detection refinement","author":"Zarzar","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0042","article-title":"LaserNet: an efficient probabilistic 3D object detector for autonomous driving","author":"Meyer","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0043","first-page":"244","article-title":"PointFusion: deep sensor fusion for 3D bounding box estimation","author":"Danfei\u202f","year":"2018","journal-title":"IEEE Conf. Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0044","first-page":"2510","article-title":"RoarNet: A Robust 3D object detection based on region approximation refinement","volume":"2019","author":"Shin","year":"2019","journal-title":"IEEE Intell. Veh. Symp. Proc."},{"key":"10.1016\/j.inffus.2020.11.002_bib0045","article-title":"PointPainting: sequential fusion for 3D object detection","author":"Vora","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0046","unstructured":"C. R.Qi, W.Liu, C.Wu, H.Su, and L. J.Guibas, \u201cFrustum PointNets for 3D object detection from RGB-D data,\u201d Nov. 2017, [Online]. Available: http:\/\/arxiv.org\/abs\/1711.08488."},{"key":"10.1016\/j.inffus.2020.11.002_bib0047","first-page":"1","article-title":"Frustum ConvNet\u202f: sliding frustums to aggregate local point-wise features for amodal 3D object detection","author":"Wang","year":"2019","journal-title":"Comp. Vis. Pattern Recogn."},{"key":"10.1016\/j.inffus.2020.11.002_bib0048","first-page":"9267","article-title":"3D object detection using scale invariant and feature reweighting networks","volume":"33","author":"Zhao","year":"2019","journal-title":"Proc. AAAI Conf. Artif. Intell."},{"key":"10.1016\/j.inffus.2020.11.002_bib0049","article-title":"PointPillars: fast encoders for object detection from point clouds","author":"Lang","year":"2018","journal-title":"Mach. Learn."},{"key":"10.1016\/j.inffus.2020.11.002_bib0050","article-title":"Vehicle detection from 3D Lidar using fully convolutional network","author":"Li","year":"2016","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0051","series-title":"2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","first-page":"6526","article-title":"Multi-view 3D object detection network for autonomous driving","author":"Chen","year":"2017"},{"key":"10.1016\/j.inffus.2020.11.002_bib0052","series-title":"IEEE Conf. Intell. Transp. Syst. Proceedings, ITSC","first-page":"3517","article-title":"BirdNet: a 3D object detection framework from LiDAR information","volume":"2018","author":"Beltr\u00e1n","year":"2018"},{"key":"10.1016\/j.inffus.2020.11.002_bib0053","series-title":"Proceedings of The 2nd Conference on Robot Learning","first-page":"146","article-title":"HDNET: exploiting HD maps for 3D object detection","volume":"87","author":"Yang","year":"2018"},{"issue":"4","key":"10.1016\/j.inffus.2020.11.002_bib0054","doi-asserted-by":"crossref","first-page":"3434","DOI":"10.1109\/LRA.2018.2852843","article-title":"RT3D: real-time 3-D vehicle detection in LiDAR point cloud for autonomous driving","volume":"3","author":"Zeng","year":"2018","journal-title":"IEEE Robot. Autom. Lett."},{"key":"10.1016\/j.inffus.2020.11.002_bib0055","series-title":"Proc. IEEE Comput. Soc. Conf. Comput. Vis. Pattern Recognit.","first-page":"7652","article-title":"PIXOR: real-time 3D object detection from point clouds","author":"Yang","year":"2018"},{"key":"10.1016\/j.inffus.2020.11.002_bib0056","series-title":"IEEE International Conference on Intelligent Robots and Systems","first-page":"5750","article-title":"Joint 3D proposal generation and object detection from view aggregation","author":"Ku","year":"2018"},{"key":"10.1016\/j.inffus.2020.11.002_bib0057","series-title":"ICASSP, IEEE Int. Conf. Acoust. Speech Signal Process. - Proc","first-page":"1992","article-title":"Scanet: spatial-channel attention network for 3D object detection","volume":"2019","author":"Lu","year":"2019"},{"key":"10.1016\/j.inffus.2020.11.002_bib0058","first-page":"663","article-title":"Deep continuous fusion for multi-sensor 3D object detection","volume":"11220","author":"Liang","year":"2018","journal-title":"Lect. Notes Comput. Sci. (including Subser. Lect. Notes Artif. Intell. Lect. Notes Bioinformatics)"},{"key":"10.1016\/j.inffus.2020.11.002_bib0059","first-page":"7337","article-title":"Multi-task multi-sensor fusion for 3D object detection","volume":"2019","author":"Liang","year":"2019","journal-title":"Proc. IEEE Comput. Soc. Conf. Comput. Vis. Pattern Recognit."},{"issue":"6","key":"10.1016\/j.inffus.2020.11.002_bib0060","doi-asserted-by":"crossref","first-page":"1434","DOI":"10.3390\/s19061434","article-title":"One-stage multi-sensor data fusion convolutional neural network for 3D object detection","volume":"19","author":"Li","year":"2019","journal-title":"Sensors"},{"key":"10.1016\/j.inffus.2020.11.002_bib0061","article-title":"Sensor fusion for joint 3D object detection and semantic segmentation","author":"Meyer","year":"2019","journal-title":"Comput. Vis. Pattern"},{"key":"10.1016\/j.inffus.2020.11.002_bib0062","article-title":"HVNet: hybrid voxel network for LiDAR based 3D object detection","author":"Ye","year":"2020","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0063","article-title":"Batch normalization: accelerating deep network training by reducing internal covariate shift","author":"Ioffe","year":"2015","journal-title":"Comput. Vis. Pattern"},{"key":"10.1016\/j.inffus.2020.11.002_bib0064","doi-asserted-by":"crossref","unstructured":"D.Zeng Wang and I.Posner, \u201cVoting for voting in online point cloud object detection,\u201d Jul. 2015, doi: 10.15607\/RSS.2015.XI.035.","DOI":"10.15607\/RSS.2015.XI.035"},{"issue":"4","key":"10.1016\/j.inffus.2020.11.002_bib0065","doi-asserted-by":"crossref","first-page":"810","DOI":"10.3390\/s19040810","article-title":"Object recognition, segmentation, and classification of mobile laser scanning point clouds: a state of the art review","volume":"19","author":"Che","year":"2019","journal-title":"Sensors"},{"issue":"6","key":"10.1016\/j.inffus.2020.11.002_bib0066","first-page":"84","article-title":"ImageNet classification with deep convolutional neural networks","volume":"60","author":"Krizhevsky","year":"2012","journal-title":"Neural Inf. Process. Syst."},{"key":"10.1016\/j.inffus.2020.11.002_bib0067","article-title":"Very deep convolutional networks for large-scale image recognition","author":"Simonyan","year":"2014","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0068","series-title":"Proceedings of the IEEE conference on computer vision and pattern recognition","first-page":"1","article-title":"Going deeper with convolutions","author":"Szegedy","year":"2015"},{"key":"10.1016\/j.inffus.2020.11.002_bib0069","doi-asserted-by":"crossref","unstructured":"K.He, X.Zhang, S.Ren, and J.Sun, \u201cDeep residual learning for image recognition,\u201d Dec. 2015.","DOI":"10.1109\/CVPR.2016.90"},{"key":"10.1016\/j.inffus.2020.11.002_bib0070","article-title":"Densely connected convolutional networks","author":"Huang","year":"2016","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0071","article-title":"Aggregated residual transformations for deep neural networks","author":"Xie","year":"2017","journal-title":"Cvpr"},{"key":"10.1016\/j.inffus.2020.11.002_bib0072","unstructured":"A. G.Howardet al., \u201cMobileNets: efficient convolutional neural networks for mobile vision applications,\u201d 2017."},{"key":"10.1016\/j.inffus.2020.11.002_bib0073","doi-asserted-by":"crossref","unstructured":"Z.Li, C.Peng, G.Yu, X.Zhang, Y.Deng, and J.Sun, \u201cDetNet: a backbone network for object detection,\u201d pp. 1\u201317, 2018.","DOI":"10.1007\/978-3-030-01240-3_21"},{"key":"10.1016\/j.inffus.2020.11.002_bib0074","series-title":"European conference on computer vision","first-page":"483","article-title":"Stacked hourglass networks for human pose estimation","author":"Newell","year":"2016"},{"key":"10.1016\/j.inffus.2020.11.002_bib0075","first-page":"765","article-title":"CornerNet: detecting objects as paired keypoints","volume":"11218","author":"Law","year":"2018","journal-title":"Eccv2018"},{"key":"10.1016\/j.inffus.2020.11.002_bib0076","article-title":"Objects as points","author":"Zhou","year":"2019","journal-title":"Comput. Vis. Pattern"},{"key":"10.1016\/j.inffus.2020.11.002_bib0077","first-page":"6568","article-title":"CenterNet: Keypoint triplets for object detection","volume":"2019","author":"Duan","year":"2019","journal-title":"Proc. IEEE Int. Conf. Comput. Vis."},{"key":"10.1016\/j.inffus.2020.11.002_bib0078","article-title":"Spatially-sparse convolutional neural networks","author":"Graham","year":"2014","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0079","article-title":"Sparse 3D convolutional neural networks","author":"Graham","year":"2015","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0080","article-title":"3D semantic segmentation with submanifold sparse convolutional networks","author":"Graham","year":"2017","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0081","article-title":"DeepGCNs: Making GCNs Go as Deep as CNNs","author":"Li","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0082","series-title":"2019 IEEE\/CVF International Conference on Computer Vision (ICCV)","first-page":"9266","article-title":"DeepGCNs: Can GCNs Go As Deep As CNNs?","author":"Li","year":"2019"},{"key":"10.1016\/j.inffus.2020.11.002_bib0083","article-title":"Deep closest point: learning representations for point cloud registration","author":"Wang","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0084","series-title":"2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","first-page":"10288","article-title":"Graph attention convolution for point cloud semantic segmentation","author":"Wang","year":"2019"},{"issue":"5","key":"10.1016\/j.inffus.2020.11.002_bib0085","doi-asserted-by":"crossref","DOI":"10.1145\/3326362","article-title":"Dynamic graph CNN for learning on point clouds","volume":"38","author":"Wang","year":"2019","journal-title":"ACM Trans. Graph."},{"key":"10.1016\/j.inffus.2020.11.002_bib0086","series-title":"2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","first-page":"2129","article-title":"Exploit all the layers: fast and accurate CNN object detector with scale dependent pooling and cascaded rejection classifiers","author":"Yang","year":"2016"},{"key":"10.1016\/j.inffus.2020.11.002_bib0087","doi-asserted-by":"crossref","unstructured":"Y.Liu, H.Li, J.Yan, F.Wei, X.Wang, and X.Tang, \u201cRecurrent scale approximation for object detection in CNN,\u201d Jul. 2017, [Online]. Available: http:\/\/arxiv.org\/abs\/1707.09531.","DOI":"10.1109\/ICCV.2017.69"},{"key":"10.1016\/j.inffus.2020.11.002_bib0088","article-title":"Learning to refine object segments","author":"Pinheiro","year":"2016","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0089","series-title":"Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)","first-page":"21","article-title":"SSD: Single shot multibox detector","volume":"9905","author":"Liu","year":"2016"},{"key":"10.1016\/j.inffus.2020.11.002_bib0090","article-title":"Deep layer aggregation","author":"Yu","year":"2017","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0091","article-title":"Rich feature hierarchies for accurate object detection and semantic segmentation","author":"Girshick","year":"2013","journal-title":"Comput. Vis. Pattern"},{"key":"10.1016\/j.inffus.2020.11.002_bib0092","series-title":"2015 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","first-page":"3431","article-title":"Fully convolutional networks for semantic segmentation","author":"Long","year":"2015"},{"key":"10.1016\/j.inffus.2020.11.002_bib0093","article-title":"Feature pyramid networks for object detection","author":"Lin","year":"2016","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0094","article-title":"You only look once: unified, real-time object detection","author":"Redmon","year":"2015","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0095","article-title":"Object as hotspots: an anchor-free 3D object detection approach via firing of hotspots","author":"Chen","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"issue":"2","key":"10.1016\/j.inffus.2020.11.002_bib0096","doi-asserted-by":"crossref","first-page":"154","DOI":"10.1007\/s11263-013-0620-5","article-title":"Selective search for object recognition","volume":"104","author":"Uijlings","year":"2013","journal-title":"Int. J. Comput. Vis."},{"issue":"11","key":"10.1016\/j.inffus.2020.11.002_bib0097","doi-asserted-by":"crossref","first-page":"3212","DOI":"10.1109\/TNNLS.2018.2876865","article-title":"Object detection with deep learning: a review","volume":"30","author":"Zhao","year":"2019","journal-title":"IEEE Trans. Neural Networks Learn. Syst."},{"key":"10.1016\/j.inffus.2020.11.002_bib0098","article-title":"Cascade R-CNN: delving into high quality object detection","author":"Cai","year":"2017","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0099","doi-asserted-by":"crossref","unstructured":"T.Kong, A.Yao, Y.Chen, and F.Sun, \u201cHyperNet: towards accurate region proposal generation and joint object detection,\u201d Apr. 2016.","DOI":"10.1109\/CVPR.2016.98"},{"key":"10.1016\/j.inffus.2020.11.002_bib0100","article-title":"R-FCN: object detection via region-based fully convolutional networks","author":"Dai","year":"2016","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0101","article-title":"OverFeat: integrated recognition, localization and detection using convolutional networks","author":"Sermanet","year":"2013","journal-title":"Comput. Vis. Pattern"},{"key":"10.1016\/j.inffus.2020.11.002_bib0102","article-title":"Scalable object detection using deep neural networks","author":"Erhan","year":"2013","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0103","doi-asserted-by":"crossref","unstructured":"S.Bell, C. L.Zitnick, K.Bala, and R.Girshick, \u201cInside-outside net: detecting objects in context with skip pooling and recurrent neural networks,\u201d Dec. 2015.","DOI":"10.1109\/CVPR.2016.314"},{"key":"10.1016\/j.inffus.2020.11.002_bib0104","first-page":"44","article-title":"Transforming auto-encoders","author":"Hinton","year":"2011","journal-title":"ICANN"},{"key":"10.1016\/j.inffus.2020.11.002_bib0105","doi-asserted-by":"crossref","first-page":"2729","DOI":"10.1109\/CVPR.2011.5995538","article-title":"Learning invariance through imitation","author":"Taylor","year":"2011","journal-title":"CVPR 2011"},{"key":"10.1016\/j.inffus.2020.11.002_bib0106","series-title":"18th International Conference on Pattern Recognition (ICPR\u201906)","first-page":"850","article-title":"Efficient non-maximum suppression","author":"Neubeck","year":"2006"},{"key":"10.1016\/j.inffus.2020.11.002_bib0107","article-title":"Deep Hough Voting for 3D Object Detection in Point Clouds","author":"Qi","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0108","article-title":"SGPN: similarity group proposal network for 3D point cloud instance segmentation","author":"Wang","year":"2017","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0109","article-title":"Learning object bounding boxes for 3D instance segmentation on point clouds","author":"Yang","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0110","doi-asserted-by":"crossref","unstructured":"T.-Y.Lin, P.Goyal, R.Girshick, K.He, and P.Doll\u00e1r, \u201cFocal loss for dense object detection,\u201d Aug. 2017, [Online]. Available: http:\/\/arxiv.org\/abs\/1708.02002.","DOI":"10.1109\/ICCV.2017.324"},{"key":"10.1016\/j.inffus.2020.11.002_bib0111","article-title":"On denoising autoencoders trained to minimise binary cross-entropy","author":"Creswell","year":"2017","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0112","unstructured":"A.Bochkovskiy, C.-Y.Wang, and H.-Y. M.Liao, \u201cYOLOv4: optimal speed and accuracy of object detection,\u201d Apr. 2020."},{"key":"10.1016\/j.inffus.2020.11.002_bib0113","first-page":"1","article-title":"Frustum ConvNet: sliding frustums to aggregate local point-wise features for amodal 3D object detection","author":"Wang","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0114","series-title":"2012 IEEE Conference on Computer Vision and Pattern Recognition","first-page":"3354","article-title":"Are we ready for autonomous driving? The KITTI vision benchmark suite","author":"Geiger","year":"2012"},{"key":"10.1016\/j.inffus.2020.11.002_bib0115","unstructured":"APTIV, \u201cNuScenes Benchmark,\u201d 2020. https:\/\/www.nuscenes.org\/object-detection?externalData=all&mapData=all&modalities=Any (accessed Jul. 20, 2020)."},{"key":"10.1016\/j.inffus.2020.11.002_bib0116","article-title":"End to end learning for self-driving cars","author":"Bojarski","year":"2016","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0117","article-title":"Multimodal end-to-end autonomous driving","author":"Xiao","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0118","article-title":"Autonomous vehicle control: end-to-end learning in simulated urban environments","author":"Haavaldsen","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0119","unstructured":"KITTI, \u201cThe KITTI Vision Benchmark Suite,\u201d 2015. http:\/\/www.cvlibs.net\/datasets\/kitti\/eval_object.php?obj_benchmark=3d (accessed May 12, 2020)."},{"issue":"11","key":"10.1016\/j.inffus.2020.11.002_bib0120","doi-asserted-by":"crossref","first-page":"1231","DOI":"10.1177\/0278364913491297","article-title":"Vision meets robotics: The KITTI dataset","volume":"32","author":"Geiger","year":"2013","journal-title":"Int. J. Rob. Res."},{"key":"10.1016\/j.inffus.2020.11.002_bib0121","article-title":"nuScenes: A multimodal dataset for autonomous driving","author":"Caesar","year":"2019","journal-title":"Proc. IEEE\/CVF Conf. Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0122","article-title":"Scalability in perception for autonomous driving: Waymo open dataset","author":"Sun","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0123","article-title":"A2D2: Audi autonomous driving dataset","author":"Geyer","year":"2020","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0124","article-title":"The H3D dataset for full-surround 3D multi-object detection and tracking in crowded urban scenes","author":"Patil","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0125","article-title":"TrafficPredict: trajectory prediction for heterogeneous traffic-agents","author":"Ma","year":"2018","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0126","series-title":"European Conference on Computer Vision and Pattern Recognition","first-page":"524","article-title":"Hard negative mining for metric learning based zero-shot classification","author":"Bucher","year":"2016"},{"key":"10.1016\/j.inffus.2020.11.002_bib0127","series-title":"Proceedings of the IEEE conference on computer vision and pattern recognition","first-page":"761","article-title":"Training region-based object detectors with online hard example mining","author":"Shrivastava","year":"2016"},{"key":"10.1016\/j.inffus.2020.11.002_bib0128","first-page":"8577","article-title":"Gradient harmonized single-stage detector","volume":"33","author":"Li","year":"2019","journal-title":"Proc. AAAI Conf. Artif. Intell."},{"issue":"1","key":"10.1016\/j.inffus.2020.11.002_bib0129","first-page":"1","article-title":"Object detection and classification by decision-level fusion for intelligent vehicle systems","volume":"17","author":"Il Oh","year":"2017","journal-title":"Sensors (Switzerland)"},{"key":"10.1016\/j.inffus.2020.11.002_bib0130","article-title":"SVGA-Net: sparse voxel-graph attention network for 3D object detection from point clouds","author":"He","year":"2020","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0131","article-title":"DetectoRS: detecting objects with recursive feature pyramid and switchable atrous convolution","author":"Qiao","year":"2020","journal-title":"Comput. Vis. Pattern"},{"key":"10.1016\/j.inffus.2020.11.002_bib0132","article-title":"Small object detection using context and attention","author":"Lim","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"issue":"1","key":"10.1016\/j.inffus.2020.11.002_bib0133","doi-asserted-by":"crossref","first-page":"11307","DOI":"10.1038\/s41598-020-67529-x","article-title":"Object detection based on an adaptive attention mechanism","volume":"10","author":"Li","year":"2020","journal-title":"Sci. Rep."},{"key":"10.1016\/j.inffus.2020.11.002_bib0134","series-title":"2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)","first-page":"1297","article-title":"Attentional pointnet for 3D-object detection in point clouds","author":"Paigwar","year":"2019"},{"key":"10.1016\/j.inffus.2020.11.002_bib0135","article-title":"On the relationship between self-attention and convolutional layers","author":"Cordonnier","year":"2019","journal-title":"Comput. Vis. Pattern"},{"key":"10.1016\/j.inffus.2020.11.002_bib0136","article-title":"Stand-alone self-attention in vision models","author":"Ramachandran","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0137","first-page":"270","article-title":"A survey on deep transfer learning","volume":"11141","author":"Tan","year":"2018","journal-title":"Lect. Notes Comput. Sci. (including Subser. Lect. Notes Artif. Intell. Lect. Notes Bioinformatics)"},{"key":"10.1016\/j.inffus.2020.11.002_bib0138","series-title":"Handbook of research on machine learning applications and trends: algorithms, methods, and techniques","first-page":"242","article-title":"Transfer learning","author":"Torrey","year":"2010"},{"key":"10.1016\/j.inffus.2020.11.002_bib0139","first-page":"1528","article-title":"A kernel theory of modern data augmentation","volume":"97","author":"Dao","year":"2018","journal-title":"Proc. Mach. Learn. Res."},{"key":"10.1016\/j.inffus.2020.11.002_bib0140","article-title":"RandAugment: Practical automated data augmentation with a reduced search space","author":"Cubuk","year":"2019","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0141","first-page":"9273","article-title":"Does data augmentation lead to positive margin?","volume":"2019","author":"Rajput","year":"2019","journal-title":"36th Int. Conf. Mach. Learn. ICML 2019"},{"key":"10.1016\/j.inffus.2020.11.002_bib0142","unstructured":"B.Settles, \u201cActive learning literature survey,\u201d 2010."},{"key":"10.1016\/j.inffus.2020.11.002_bib0143","unstructured":"S.Roy, A.Unmesh, and V. P.Namboodiri, \u201cDeep active learning for object detection,\u201d 2018."},{"key":"10.1016\/j.inffus.2020.11.002_bib0144","article-title":"Large-scale visual active learning with deep probabilistic ensembles","author":"Chitta","year":"2018","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0145","article-title":"Active learning for convolutional neural networks: a core-set approach","author":"Sener","year":"2017","journal-title":"Mach. Learn."},{"key":"10.1016\/j.inffus.2020.11.002_bib0146","article-title":"Localization-aware active learning for object detection","author":"Kao","year":"2018","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0147","doi-asserted-by":"crossref","unstructured":"H. H.Aghdam, A.Gonzalez-Garcia, J.van de Weijer, and A. M.L\u00f3pez, \u201cActive learning for deep detection neural networks,\u201d Nov. 2019.","DOI":"10.1109\/ICCV.2019.00377"},{"key":"10.1016\/j.inffus.2020.11.002_bib0148","article-title":"Active learning for deep object detection","author":"Brust","year":"2018","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0149","article-title":"Scalable active learning for object detection","author":"Haussmann","year":"2020","journal-title":"Comput. Vis. Pattern Recognit."},{"key":"10.1016\/j.inffus.2020.11.002_bib0150","series-title":"2018 IEEE\/CVF Conference on Computer Vision and Pattern Recognition","first-page":"3569","article-title":"Fast and furious: real time end-to-end 3D detection, tracking and motion forecasting with a single convolutional net","author":"Luo","year":"2018"},{"key":"10.1016\/j.inffus.2020.11.002_bib0151","series-title":"International Conference on Intelligent Robotics and Applications","first-page":"582","article-title":"A semantic segmentation based lidar SLAM system towards dynamic environments","author":"Jian","year":"2019"},{"issue":"7","key":"10.1016\/j.inffus.2020.11.002_bib0152","doi-asserted-by":"crossref","first-page":"2068","DOI":"10.3390\/s20072068","article-title":"A review of visual-LiDAR fusion based simultaneous localization and mapping","volume":"20","author":"Debeunne","year":"2020","journal-title":"Sensors"},{"key":"10.1016\/j.inffus.2020.11.002_bib0153","article-title":"Explainable artificial intelligence (XAI): concepts, taxonomies, opportunities and challenges toward responsible AI","author":"Arrieta","year":"2019","journal-title":"Artif. Intell."}],"container-title":["Information Fusion"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1566253520304097?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1566253520304097?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2025,10,27]],"date-time":"2025-10-27T13:01:11Z","timestamp":1761570071000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S1566253520304097"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,4]]},"references-count":153,"alternative-id":["S1566253520304097"],"URL":"https:\/\/doi.org\/10.1016\/j.inffus.2020.11.002","relation":{},"ISSN":["1566-2535"],"issn-type":[{"value":"1566-2535","type":"print"}],"subject":[],"published":{"date-parts":[[2021,4]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"Point-cloud based 3D object detection and classification methods for self-driving applications: A survey and taxonomy","name":"articletitle","label":"Article Title"},{"value":"Information Fusion","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.inffus.2020.11.002","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2020 Elsevier B.V. All rights reserved.","name":"copyright","label":"Copyright"}]}}