{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T17:46:10Z","timestamp":1777657570294,"version":"3.51.4"},"publisher-location":"Cham","reference-count":56,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783030585471","type":"print"},{"value":"9783030585488","type":"electronic"}],"license":[{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020]]},"DOI":"10.1007\/978-3-030-58548-8_37","type":"book-chapter","created":{"date-parts":[[2020,10,28]],"date-time":"2020-10-28T23:02:42Z","timestamp":1603926162000},"page":"638-655","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":34,"title":["Semantic Object Prediction and Spatial Sound Super-Resolution with Binaural Sounds"],"prefix":"10.1007","author":[{"given":"Arun Balajee","family":"Vasudevan","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dengxin","family":"Dai","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Luc","family":"Van Gool","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2020,10,29]]},"reference":[{"issue":"4","key":"37_CR1","doi-asserted-by":"publisher","first-page":"297","DOI":"10.1006\/csla.1994.1016","volume":"8","author":"Computational auditory scene analysis","year":"1994","unstructured":"Computational auditory scene analysis: Comput. Speech Lang. 8(4), 297\u2013336 (1994)","journal-title":"Comput. Speech Lang."},{"key":"37_CR2","doi-asserted-by":"crossref","unstructured":"Albanie, S., Nagrani, A., Vedaldi, A., Zisserman, A.: Emotion recognition in speech using cross-modal transfer in the wild. In: ACM Multimedia (2018)","DOI":"10.1145\/3240508.3240578"},{"issue":"10","key":"37_CR3","doi-asserted-by":"publisher","first-page":"2683","DOI":"10.1109\/TASL.2012.2210877","volume":"20","author":"F Antonacci","year":"2012","unstructured":"Antonacci, F., et al.: Inference of room geometry from acoustic impulse responses. IEEE Trans. Audio Speech Lang Process. 20(10), 2683\u20132695 (2012)","journal-title":"IEEE Trans. Audio Speech Lang Process."},{"key":"37_CR4","doi-asserted-by":"crossref","unstructured":"Arandjelovic, R., Zisserman, A.: Look, listen and learn. In: The IEEE International Conference on Computer Vision (ICCV) (2017)","DOI":"10.1109\/ICCV.2017.73"},{"key":"37_CR5","doi-asserted-by":"crossref","unstructured":"Arandjelovi\u0107, R., Zisserman, A.: Objects that sound. In: Proceedings of the European conference on computer vision (ECCV) (2018)","DOI":"10.1007\/978-3-030-01246-5_27"},{"issue":"1","key":"37_CR6","doi-asserted-by":"publisher","first-page":"87","DOI":"10.1016\/j.csl.2015.03.003","volume":"34","author":"S Argentieri","year":"2015","unstructured":"Argentieri, S., Dan\u00e8s, P., Sou\u00e8res, P.: A survey on sound source localization in robotics: from binaural to array processing methods. Comput. Speech Lang. 34(1), 87\u2013112 (2015)","journal-title":"Comput. Speech Lang."},{"key":"37_CR7","doi-asserted-by":"crossref","unstructured":"Aytar, Y., Vondrick, C., Torralba, A.: SoundNet: learning sound representations from unlabeled video. In: Advances in Neural Information Processing Systems (NIPS) (2016)","DOI":"10.1109\/CVPR.2016.18"},{"key":"37_CR8","doi-asserted-by":"crossref","unstructured":"Balajee Vasudevan, A., Dai, D., Van Gool, L.: Object referring in visual scene with spoken language. In: Winter Conference on Applications of Computer Vision (WACV) (2018)","DOI":"10.1109\/WACV.2018.00206"},{"key":"37_CR9","doi-asserted-by":"crossref","unstructured":"Barzelay, Z., Schechner, Y.Y.: Harmony in motion. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2007)","DOI":"10.1109\/CVPR.2007.383344"},{"key":"37_CR10","doi-asserted-by":"crossref","unstructured":"Brutzer, S., H\u00f6ferlin, B., Heidemann, G.: Evaluation of background subtraction techniques for video surveillance. In: The IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2011)","DOI":"10.1109\/CVPR.2011.5995508"},{"issue":"4","key":"37_CR11","doi-asserted-by":"publisher","first-page":"834","DOI":"10.1109\/TPAMI.2017.2699184","volume":"40","author":"LC Chen","year":"2017","unstructured":"Chen, L.C., Papandreou, G., Kokkinos, I., Murphy, K., Yuille, A.L.: DeepLab: semantic image segmentation with deep convolutional nets, atrous convolution, and fully connected CRFs. IEEE Trans. Pattern Anal. Mach. Intell. (TPAMI) 40(4), 834\u2013848 (2017)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell. (TPAMI)"},{"key":"37_CR12","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"833","DOI":"10.1007\/978-3-030-01234-2_49","volume-title":"Computer Vision \u2013 ECCV 2018","author":"L-C Chen","year":"2018","unstructured":"Chen, L.-C., Zhu, Y., Papandreou, G., Schroff, F., Adam, H.: Encoder-decoder with atrous separable convolution for semantic image segmentation. In: Ferrari, V., Hebert, M., Sminchisescu, C., Weiss, Y. (eds.) ECCV 2018. LNCS, vol. 11211, pp. 833\u2013851. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-030-01234-2_49"},{"key":"37_CR13","doi-asserted-by":"crossref","unstructured":"Cordts, M., et al.: The cityscapes dataset for semantic urban scene understanding. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2016)","DOI":"10.1109\/CVPR.2016.350"},{"issue":"7","key":"37_CR14","doi-asserted-by":"publisher","first-page":"1171","DOI":"10.1002\/rob.21887","volume":"36","author":"J Delmerico","year":"2019","unstructured":"Delmerico, J., et al.: The current state and future outlook of rescue robotics. J. Field Robot. 36(7), 1171\u20131191 (2019)","journal-title":"J. Field Robot."},{"key":"37_CR15","doi-asserted-by":"crossref","unstructured":"Deruyttere, T., Vandenhende, S., Grujicic, D., Van Gool, L., Moens, M.F.: Talk2Car: taking control of your self-driving car. In: EMNLP-IJCNLP (2019)","DOI":"10.18653\/v1\/D19-1215"},{"issue":"30","key":"37_CR16","doi-asserted-by":"publisher","first-page":"12186","DOI":"10.1073\/pnas.1221464110","volume":"110","author":"I Dokmanic","year":"2013","unstructured":"Dokmanic, I., Parhizkar, R., Walther, A., Lu, Y.M., Vetterli, M.: Acoustic echoes reveal room shape. Proc. Nat. Acad. Sci. 110(30), 12186\u201312191 (2013)","journal-title":"Proc. Nat. Acad. Sci."},{"key":"37_CR17","unstructured":"Fazenda, B., Atmoko, H., Gu, F., Guan, L., Ball, A.: Acoustic based safety emergency vehicle detection for intelligent transport systems. In: ICCAS-SICE (2009)"},{"issue":"3","key":"37_CR18","doi-asserted-by":"publisher","first-page":"373","DOI":"10.1162\/jocn.1993.5.3.373","volume":"5","author":"R Fendrich","year":"1993","unstructured":"Fendrich, R.: The merging of the senses. J. Cogn. Neurosci. 5(3), 373\u2013374 (1993)","journal-title":"J. Cogn. Neurosci."},{"key":"37_CR19","doi-asserted-by":"crossref","unstructured":"Gan, C., Zhao, H., Chen, P., Cox, D., Torralba, A.: Self-supervised moving vehicle tracking with stereo sound. In: The IEEE International Conference on Computer Vision (ICCV) (2019)","DOI":"10.1109\/ICCV.2019.00715"},{"key":"37_CR20","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"36","DOI":"10.1007\/978-3-030-01219-9_3","volume-title":"Computer Vision \u2013 ECCV 2018","author":"R Gao","year":"2018","unstructured":"Gao, R., Feris, R., Grauman, K.: Learning to separate object sounds by watching unlabeled video. In: Ferrari, V., Hebert, M., Sminchisescu, C., Weiss, Y. (eds.) ECCV 2018. LNCS, vol. 11207, pp. 36\u201354. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-030-01219-9_3"},{"key":"37_CR21","doi-asserted-by":"crossref","unstructured":"Gao, R., Grauman, K.: 2.5 D visual sound. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 324\u2013333 (2019)","DOI":"10.1109\/CVPR.2019.00041"},{"key":"37_CR22","doi-asserted-by":"crossref","unstructured":"Gao, R., Grauman, K.: Co-separating sounds of visual objects. In: The IEEE International Conference on Computer Vision (ICCV), October 2019","DOI":"10.1109\/ICCV.2019.00398"},{"issue":"1","key":"37_CR23","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1207\/s15326969eco0501_1","volume":"5","author":"WW Gaver","year":"1993","unstructured":"Gaver, W.W.: What in the world do we hear?: an ecological approach to auditory event perception. Ecol. Psychol. 5(1), 1\u201329 (1993)","journal-title":"Ecol. Psychol."},{"issue":"11","key":"37_CR24","doi-asserted-by":"publisher","first-page":"1231","DOI":"10.1177\/0278364913491297","volume":"32","author":"A Geiger","year":"2013","unstructured":"Geiger, A., Lenz, P., Stiller, C., Urtasun, R.: Vision meets robotics: the kitti dataset. Int. J. Robot. Res. (IJRR) 32(11), 1231\u20131237 (2013)","journal-title":"Int. J. Robot. Res. (IJRR)"},{"key":"37_CR25","doi-asserted-by":"crossref","unstructured":"Godard, C., Aodha, O.M., Firman, M., Brostow, G.J.: Digging into self-supervised monocular depth estimation. In: Proceedings of the IEEE International Conference on Computer Vision (CVPR), pp. 3828\u20133838 (2019)","DOI":"10.1109\/ICCV.2019.00393"},{"key":"37_CR26","doi-asserted-by":"crossref","unstructured":"Griffin, D., Lim, J.: Signal estimation from modified short-time Fourier transform. In: IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), vol. 8, pp. 804\u2013807 (1983)","DOI":"10.1109\/ICASSP.1983.1172092"},{"key":"37_CR27","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"449","DOI":"10.1007\/978-3-030-01234-2_27","volume-title":"Computer Vision \u2013 ECCV 2018","author":"S Hecker","year":"2018","unstructured":"Hecker, S., Dai, D., Van Gool, L.: End-to-end learning of driving models with surround-view cameras and route planners. In: Ferrari, V., Hebert, M., Sminchisescu, C., Weiss, Y. (eds.) ECCV 2018. LNCS, vol. 11211, pp. 449\u2013468. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-030-01234-2_27"},{"key":"37_CR28","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4614-4205-9","volume-title":"Human factors in augmented reality environments","author":"W Huang","year":"2012","unstructured":"Huang, W., Alem, L., Livingston, M.A.: Human factors in augmented reality environments. Springer, New York (2012). https:\/\/doi.org\/10.1007\/978-1-4614-4205-9"},{"key":"37_CR29","doi-asserted-by":"crossref","unstructured":"Irie, G., et al.: Seeing through sounds: predicting visual semantic segmentation results from multichannel audio signals. In: IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 3961\u20133964 (2019)","DOI":"10.1109\/ICASSP.2019.8683142"},{"key":"37_CR30","doi-asserted-by":"crossref","unstructured":"Kim, H., Remaggi, L., Jackson, P.J., Fazi, F.M., Hilton, A.: 3D room geometry reconstruction using audio-visual sensors. In: International Conference on 3D Vision (3DV), pp. 621\u2013629 (2017)","DOI":"10.1109\/3DV.2017.00076"},{"key":"37_CR31","unstructured":"Kingma, D.P., Ba, J.: Adam: a method for stochastic optimization. arXiv preprint arXiv:1412.6980 (2014)"},{"issue":"1","key":"37_CR32","doi-asserted-by":"publisher","first-page":"012378","DOI":"10.1155\/ASP\/2006\/12378","volume":"2006","author":"U Klee","year":"2006","unstructured":"Klee, U., Gehrig, T., McDonough, J.: Kalman filters for time delay of arrival-based source localization. EURASIP J. Adv. Signal Process. 2006(1), 012378 (2006)","journal-title":"EURASIP J. Adv. Signal Process."},{"issue":"4","key":"37_CR33","first-page":"12","volume":"37","author":"D Li","year":"2018","unstructured":"Li, D., Langlois, T.R., Zheng, C.: Scene-aware audio for 360$$^{\\circ }$$ videos. ACM Trans. Graph 37(4), 12 (2018)","journal-title":"ACM Trans. Graph"},{"key":"37_CR34","doi-asserted-by":"crossref","unstructured":"Marchegiani, L., Posner, I.: Leveraging the urban soundscape: auditory perception for smart vehicles. In: IEEE International Conference on Robotics and Automation (ICRA) (2017)","DOI":"10.1109\/ICRA.2017.7989774"},{"key":"37_CR35","doi-asserted-by":"publisher","first-page":"210","DOI":"10.3389\/fnins.2014.00210","volume":"8","author":"KI McAnally","year":"2014","unstructured":"McAnally, K.I., Martin, R.L.: Sound localization with head movement: implications for 3-d audio displays. Front. Neurosci. 8, 210 (2014)","journal-title":"Front. Neurosci."},{"key":"37_CR36","doi-asserted-by":"crossref","unstructured":"Mousavian, A., Pirsiavash, H., Ko\u0161eck\u00e1, J.: Joint semantic segmentation and depth estimation with deep convolutional networks. In: International Conference on 3D Vision (3DV), pp. 611\u2013619 (2016)","DOI":"10.1109\/3DV.2016.69"},{"key":"37_CR37","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"639","DOI":"10.1007\/978-3-030-01231-1_39","volume-title":"Computer Vision \u2013 ECCV 2018","author":"A Owens","year":"2018","unstructured":"Owens, A., Efros, A.A.: Audio-visual scene analysis with self-supervised multisensory features. In: Ferrari, V., Hebert, M., Sminchisescu, C., Weiss, Y. (eds.) ECCV 2018. LNCS, vol. 11210, pp. 639\u2013658. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-030-01231-1_39"},{"key":"37_CR38","doi-asserted-by":"crossref","unstructured":"Owens, A., Isola, P., McDermott, J., Torralba, A., Adelson, E.H., Freeman, W.T.: Visually indicated sounds. In: The IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2016)","DOI":"10.1109\/CVPR.2016.264"},{"key":"37_CR39","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"801","DOI":"10.1007\/978-3-319-46448-0_48","volume-title":"Computer Vision \u2013 ECCV 2016","author":"A Owens","year":"2016","unstructured":"Owens, A., Wu, J., McDermott, J.H., Freeman, W.T., Torralba, A.: Ambient sound provides supervision for visual learning. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9905, pp. 801\u2013816. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46448-0_48"},{"key":"37_CR40","unstructured":"Morgado, P., Vasconcelos, N., Langlois, T., Wang, O.: Self-supervised generation of spatial audio for 360 deg video. In: Neural Information Processing Systems (NIPS) (2018)"},{"key":"37_CR41","doi-asserted-by":"publisher","first-page":"184","DOI":"10.1016\/j.robot.2017.07.011","volume":"96","author":"C Rascon","year":"2017","unstructured":"Rascon, C., Meza, I.: Localization of sound sources in robotics: a review. Robot. Auton. Syst. 96, 184\u2013210 (2017)","journal-title":"Robot. Auton. Syst."},{"issue":"3","key":"37_CR42","doi-asserted-by":"publisher","first-page":"181","DOI":"10.1207\/S15326969ECO1203_1","volume":"12","author":"LD Rosenblum","year":"2000","unstructured":"Rosenblum, L.D., Gordon, M.S., Jarquin, L.: Echolocating distance by moving and stationary listeners. Ecol. Psychol. 12(3), 181\u2013206 (2000)","journal-title":"Ecol. Psychol."},{"issue":"1\u20133","key":"37_CR43","doi-asserted-by":"publisher","first-page":"157","DOI":"10.1007\/s11263-007-0090-8","volume":"77","author":"BC Russell","year":"2008","unstructured":"Russell, B.C., Torralba, A., Murphy, K.P., Freeman, W.T.: LabelMe: a database and web-based tool for image annotation. Int. J. Comput. Vis. (IJCV) 77(1\u20133), 157\u2013173 (2008)","journal-title":"Int. J. Comput. Vis. (IJCV)"},{"key":"37_CR44","doi-asserted-by":"crossref","unstructured":"Salamon, J., Jacoby, C., Bello, J.P.: A dataset and taxonomy for urban sound research. In: ACM Multimedia (2014)","DOI":"10.1145\/2647868.2655045"},{"key":"37_CR45","doi-asserted-by":"crossref","unstructured":"Saxena, A., Ng, A.Y.: Learning sound location from a single microphone. In: IEEE International Conference on Robotics and Automation (ICRA) (2009)","DOI":"10.1109\/ROBOT.2009.5152861"},{"key":"37_CR46","doi-asserted-by":"crossref","unstructured":"Senocak, A., Oh, T.H., Kim, J., Yang, M.H., So Kweon, I.: Learning to localize sound source in visual scenes. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2018)","DOI":"10.1109\/CVPR.2018.00458"},{"key":"37_CR47","unstructured":"Simeoni, M.M.J.A., Kashani, S., Hurley, P., Vetterli, M.: DeepWave: a recurrent neural-network for real-time acoustic imaging. In: Neural Information Processing Systems (NIPS), p. 38 (2019)"},{"issue":"2","key":"37_CR48","doi-asserted-by":"publisher","first-page":"489","DOI":"10.1121\/1.1910605","volume":"42","author":"WR Thurlow","year":"1967","unstructured":"Thurlow, W.R., Mangels, J.W., Runge, P.S.: Head movements during sound localizationtd. J. Acoust. Soc. Am. 42(2), 489\u2013493 (1967)","journal-title":"J. Acoust. Soc. Am."},{"key":"37_CR49","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"252","DOI":"10.1007\/978-3-030-01216-8_16","volume-title":"Computer Vision \u2013 ECCV 2018","author":"Y Tian","year":"2018","unstructured":"Tian, Y., Shi, J., Li, B., Duan, Z., Xu, C.: Audio-visual event localization in unconstrained videos. In: Ferrari, V., Hebert, M., Sminchisescu, C., Weiss, Y. (eds.) ECCV 2018. LNCS, vol. 11206, pp. 252\u2013268. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-030-01216-8_16"},{"issue":"2","key":"37_CR50","doi-asserted-by":"publisher","first-page":"1918","DOI":"10.3390\/s140201918","volume":"14","author":"J Tiete","year":"2014","unstructured":"Tiete, J., Dom\u00ednguez, F., da Silva, B., Segers, L., Steenhaut, K., Touhafi, A.: SoundCompass: a distributed MEMS microphone array-based sensor for sound source localization. Sensors 14(2), 1918\u20131949 (2014)","journal-title":"Sensors"},{"key":"37_CR51","unstructured":"Urmson, C., et al.: Autonomous driving in urban environments: boss and the urban challenge. J. Field Robot. 25(8), 425\u2013466 (2008). Special Issue on the 2007 DARPA Urban Challenge, Part I"},{"key":"37_CR52","unstructured":"Vandenhende, S., Georgoulis, S., Proesmans, M., Dai, D., Van Gool, L.: Revisiting multi-task learning in the deep learning era. arXiv (2020)"},{"issue":"4","key":"37_CR53","doi-asserted-by":"publisher","first-page":"339","DOI":"10.1037\/h0054629","volume":"27","author":"H Wallach","year":"1940","unstructured":"Wallach, H.: The role of head movements and vestibular and visual cues in sound localization. J. Exp. Psychol. 27(4), 339 (1940)","journal-title":"J. Exp. Psychol."},{"key":"37_CR54","doi-asserted-by":"crossref","unstructured":"Ye, M., Zhang, Y., Yang, R., Manocha, D.: 3D reconstruction in the presence of glasses by acoustic and stereo fusion. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2015)","DOI":"10.1109\/CVPR.2015.7299122"},{"key":"37_CR55","doi-asserted-by":"crossref","unstructured":"Zhao, H., Gan, C., Ma, W.C., Torralba, A.: The sound of motions. In: The IEEE International Conference on Computer Vision (ICCV) (2019)","DOI":"10.1109\/ICCV.2019.00182"},{"key":"37_CR56","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"587","DOI":"10.1007\/978-3-030-01246-5_35","volume-title":"Computer Vision \u2013 ECCV 2018","author":"H Zhao","year":"2018","unstructured":"Zhao, H., Gan, C., Rouditchenko, A., Vondrick, C., McDermott, J., Torralba, A.: The sound of pixels. In: Ferrari, V., Hebert, M., Sminchisescu, C., Weiss, Y. (eds.) ECCV 2018. LNCS, vol. 11205, pp. 587\u2013604. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-030-01246-5_35"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2020"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-58548-8_37","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,29]],"date-time":"2024-10-29T00:17:19Z","timestamp":1730161039000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-58548-8_37"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020]]},"ISBN":["9783030585471","9783030585488"],"references-count":56,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-58548-8_37","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020]]},"assertion":[{"value":"29 October 2020","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Glasgow","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"United Kingdom","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2020","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"23 August 2020","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"28 August 2020","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"16","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2020","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2020.eu\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"OpenReview","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"5025","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"1360","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"27% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"7","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"The conference was held virtually due to the COVID-19 pandemic.","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}