{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T19:09:28Z","timestamp":1775243368460,"version":"3.50.1"},"publisher-location":"Cham","reference-count":38,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783030012335","type":"print"},{"value":"9783030012342","type":"electronic"}],"license":[{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018]]},"DOI":"10.1007\/978-3-030-01234-2_33","type":"book-chapter","created":{"date-parts":[[2018,10,5]],"date-time":"2018-10-05T12:13:11Z","timestamp":1538741591000},"page":"554-569","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":134,"title":["Small-Scale Pedestrian Detection Based on Topological Line Localization and Temporal Feature Aggregation"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9146-9386","authenticated-orcid":false,"given":"Tao","family":"Song","sequence":"first","affiliation":[]},{"given":"Leiyu","family":"Sun","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8065-5901","authenticated-orcid":false,"given":"Di","family":"Xie","sequence":"additional","affiliation":[]},{"given":"Haiming","family":"Sun","sequence":"additional","affiliation":[]},{"given":"Shiliang","family":"Pu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,10,6]]},"reference":[{"issue":"4","key":"33_CR1","doi-asserted-by":"publisher","first-page":"743","DOI":"10.1109\/TPAMI.2011.155","volume":"34","author":"P. Dollar","year":"2012","unstructured":"Dollar, P., Wojek, C., Schiele, B., Perona, P.: Pedestrian detection: an evaluation of the state of the art. In: PAMI, pp. 743\u2013761 (2012)","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"33_CR2","doi-asserted-by":"crossref","unstructured":"Dollar, P., Appel, R., Belongie, S., Perona, P.: Fast feature pyramids for object detection. In: PAMI (2014)","DOI":"10.1109\/TPAMI.2014.2300479"},{"key":"33_CR3","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"443","DOI":"10.1007\/978-3-319-46475-6_28","volume-title":"Computer Vision \u2013 ECCV 2016","author":"L Zhang","year":"2016","unstructured":"Zhang, L., Lin, L., Liang, X., He, K.: Is faster R-CNN doing well for pedestrian detection? In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9906, pp. 443\u2013457. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46475-6_28"},{"key":"33_CR4","unstructured":"Li, J., Liang, X., Shen, S.M., Xu, T., Feng, J., Yan, S.: Scale-aware fast R-CNN for pedestrian detection. In: Multimedia (2015)"},{"key":"33_CR5","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"354","DOI":"10.1007\/978-3-319-46493-0_22","volume-title":"Computer Vision \u2013 ECCV 2016","author":"Z Cai","year":"2016","unstructured":"Cai, Z., Fan, Q., Feris, R.S., Vasconcelos, N.: A unified multi-scale deep convolutional neural network for fast object detection. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9908, pp. 354\u2013370. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46493-0_22"},{"key":"33_CR6","unstructured":"Ren, S., He, K., Girshick, R., Sun, J.: Faster R-CNN: towards real-time object detection with region proposal networks. In: NIPS (2015)"},{"key":"33_CR7","unstructured":"Dai, J., Li, Y., He, K., Sun, J.: R-FCN: object detection via region-based fully convolutional networks. In: NIPS (2016)"},{"key":"33_CR8","first-page":"230","volume":"I","author":"A Balke","year":"1994","unstructured":"Balke, A., Pearl, J.: Probabilistic evaluation of counterfactual queries. AAA I, 230\u2013237 (1994)","journal-title":"AAA"},{"key":"33_CR9","doi-asserted-by":"crossref","unstructured":"Zhang, C., Li, H., Wang, X., Yang, X.: Cross-scene crowd counting via deep convolutional neural networks. In: CVPR, pp. 833\u2013841 (2015)","DOI":"10.1109\/CVPR.2015.7298684"},{"key":"33_CR10","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Zhou, D., Chen, S., Gao, S., Ma, Y.: Single-image crowd counting via multi-column convolutional neural network. In: CVPR, pp. 589\u2013597 (2016)","DOI":"10.1109\/CVPR.2016.70"},{"key":"33_CR11","doi-asserted-by":"crossref","unstructured":"Cao, Z., Simon, T., Wei, S.E., Sheikh, Y.: Realtime multi-person 2D pose estimation using part affinity fields. In: CVPR, pp. 7291\u20137299 (2017)","DOI":"10.1109\/CVPR.2017.143"},{"key":"33_CR12","doi-asserted-by":"crossref","unstructured":"Papandreou, G., et al.: Towards accurate multi-person pose estimation in the wild. In: CVPR, pp. 4903\u20134911 (2017)","DOI":"10.1109\/CVPR.2017.395"},{"key":"33_CR13","unstructured":"Li, C., Zhong, Q., Xie, D., Pu, S.: Skeleton-based action recognition with convolutional neural networks. In: ICMEW (2017)"},{"key":"33_CR14","doi-asserted-by":"crossref","unstructured":"Dollar, P., Wojek, C., Schiele, B., Perona, P.: Pedestrian detection: a benchmark. In: CVPR, pp. 304\u2013311 (2009)","DOI":"10.1109\/CVPR.2009.5206631"},{"key":"33_CR15","doi-asserted-by":"crossref","unstructured":"Zhang, S., Benenson, R., Schiele, B.: CityPersons: a diverse dataset for pedestrian detection. In: CVPR, pp. 3213\u20133221 (2017)","DOI":"10.1109\/CVPR.2017.474"},{"key":"33_CR16","doi-asserted-by":"crossref","unstructured":"Girshick, R., Donahue, J., Darrell, T., Malik, J.: Rich feature hierarchies for accurate object detection and semantic segmentation. In: CVPR, pp. 580\u2013587 (2014)","DOI":"10.1109\/CVPR.2014.81"},{"key":"33_CR17","doi-asserted-by":"crossref","unstructured":"Redmon, J., Divvala, S., Girshick, R., Farhadi, A.: You only look once: unified, real-time object detection. In: CVPR, pp. 779\u2013788 (2016)","DOI":"10.1109\/CVPR.2016.91"},{"key":"33_CR18","doi-asserted-by":"crossref","unstructured":"Redmon, J., Farhadi, A.: Yolo9000: better, faster, stronger. In: CVPR, pp. 7263\u20137271 (2017)","DOI":"10.1109\/CVPR.2017.690"},{"key":"33_CR19","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"21","DOI":"10.1007\/978-3-319-46448-0_2","volume-title":"Computer Vision \u2013 ECCV 2016","author":"W Liu","year":"2016","unstructured":"Liu, W., et al.: SSD: single shot multibox detector. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9905, pp. 21\u201337. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46448-0_2"},{"key":"33_CR20","doi-asserted-by":"crossref","unstructured":"Du, X., El-Khamy, M., Lee, J., Davis, L.: Fused DNN: a deep neural network fusion approach to fast and robust pedestrian detection. In: WACV (2017)","DOI":"10.1109\/WACV.2017.111"},{"key":"33_CR21","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: CVPR, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"33_CR22","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Liu, W., Jia, Y., Sermanet, P., et al.: Going deeper with convolutions. In: CVPR, pp. 1\u20139 (2015)","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"33_CR23","doi-asserted-by":"crossref","unstructured":"Brazil, G., Yin, X., Liu, X.: Illuminating pedestrians via simultaneous detection & segmentation. In: ICCV, pp. 4950\u20134959 (2017)","DOI":"10.1109\/ICCV.2017.530"},{"key":"33_CR24","unstructured":"Zhang, X., Cheng, L., Li, B., Hu, H.M.: Too far to see? Not really !\u2013pedestrian detection with scale-aware localization policy. arXiv preprint (2017). arXiv: 1709.00235"},{"key":"33_CR25","doi-asserted-by":"crossref","unstructured":"Zhang, S., Benenson, R., Omran, M., Hosang, J., Schiele, B.: How far are we from solving pedestrian detection? In: CVPR, pp. 1259\u20131267 (2016)","DOI":"10.1109\/CVPR.2016.141"},{"key":"33_CR26","doi-asserted-by":"crossref","unstructured":"Kang, K., Ouyang, W., Li, H., Wang, X.: Object detection from video tubelets with convolutional neural networks. In: CVPR, pp. 817\u2013825 (2016)","DOI":"10.1109\/CVPR.2016.95"},{"key":"33_CR27","doi-asserted-by":"crossref","unstructured":"Zhu, X., Wang, Y., Dai, J., Yuan, L., Wei, Y.: Flow-guided feature aggregation for video object detection. In: ICCV, pp. 408\u2013417 (2017)","DOI":"10.1109\/ICCV.2017.52"},{"key":"33_CR28","doi-asserted-by":"crossref","unstructured":"Dosovitskiy, A., Fischery, P., Ilg, E., et al.: FlowNet: learning optical flow with convolutional networks. In: ICCV, pp. 2758\u20132766 (2015)","DOI":"10.1109\/ICCV.2015.316"},{"key":"33_CR29","unstructured":"Liu, M., Zhu, M.: Mobile video object detection with temporally-aware feature maps. arXiv preprint (2017). arXiv: 1711.06368"},{"issue":"4","key":"33_CR30","doi-asserted-by":"publisher","first-page":"225","DOI":"10.1137\/0202019","volume":"2","author":"JE Hopcroft","year":"1973","unstructured":"Hopcroft, J.E., Karp, R.M.: An $$n^{5\/2}$$ algorithm for maximum matching in bipartite graphs. SIAM J. Comput. 2(4), 225\u2013231 (1973)","journal-title":"SIAM J. Comput."},{"key":"33_CR31","first-page":"29","volume-title":"50 Years of Integer Programming 1958-2008","author":"Harold W. Kuhn","year":"2009","unstructured":"Kuhn, H.W.: The hungarian method for the assignment problem. 50 Years of Integer Programming 1958\u20132008 29\u201347"},{"key":"33_CR32","doi-asserted-by":"crossref","unstructured":"Ng, J.Y.H., Hausknecht, M., Vijayanarasimhan, S., Vinyals, O., Monga, R., Toderici, G.: Beyond short snippets: deep networks for video classification. In: CVPR, pp. 4694\u20134702 (2015)","DOI":"10.1109\/CVPR.2015.7299101"},{"key":"33_CR33","doi-asserted-by":"crossref","unstructured":"Grushin, A., Monner, D.D., Reggia, J.A., Mishra, A.: Robust human action recognition via long short-term memory. In: IJCNN (2013)","DOI":"10.1109\/IJCNN.2013.6706797"},{"key":"33_CR34","unstructured":"Shi, X., Chen, Z., Wang, H., Yeung, D.Y., Wang, W., WOO, W.: Convolutional LSTM network: a machine learning approach for precipitation nowcasting. In: NIPS, pp. 802\u2013810 (2015)"},{"key":"33_CR35","doi-asserted-by":"crossref","unstructured":"Geiger, A., Lenz, P., Urtasun, R.: Are we ready for autonomous driving? The kitti vision benchmark suite. In: CVPR (2012)","DOI":"10.1109\/CVPR.2012.6248074"},{"key":"33_CR36","doi-asserted-by":"crossref","unstructured":"Cordts, M., Omran, M., Ramos, S., et al.: The cityscapes dataset for semantic urban scene understanding. In: CVPR (2016)","DOI":"10.1109\/CVPR.2016.350"},{"key":"33_CR37","unstructured":"Ouyang, W., Zhou, H., Li, H., et al.: Jointly learning deep features, deformable parts, occlusion and classification for pedestrian detection. In: PAMI (2017)"},{"key":"33_CR38","doi-asserted-by":"crossref","unstructured":"Wang, X., Xiao, T., Jiang, Y., Shao, S., Sun, J., Shen, C.: Repulsion loss: detecting pedestrians in a crowd. arXiv preprint (2017). arXiv: 1711.07752","DOI":"10.1109\/CVPR.2018.00811"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2018"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-01234-2_33","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T18:33:53Z","timestamp":1775241233000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-01234-2_33"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018]]},"ISBN":["9783030012335","9783030012342"],"references-count":38,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-01234-2_33","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018]]},"assertion":[{"value":"6 October 2018","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Munich","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Germany","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2018","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"8 September 2018","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"14 September 2018","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"15","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2018","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2018.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}