{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,18]],"date-time":"2026-01-18T23:24:16Z","timestamp":1768778656855,"version":"3.49.0"},"reference-count":82,"publisher":"Springer Science and Business Media LLC","issue":"6-7","license":[{"start":{"date-parts":[[2018,11,28]],"date-time":"2018-11-28T00:00:00Z","timestamp":1543363200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100012166","name":"National Key Research and Development Program","doi-asserted-by":"crossref","award":["2017YFA0700802"],"award-info":[{"award-number":["2017YFA0700802"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2019,6]]},"DOI":"10.1007\/s11263-018-1135-x","type":"journal-article","created":{"date-parts":[[2018,11,27]],"date-time":"2018-11-27T22:28:36Z","timestamp":1543357716000},"page":"701-718","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":50,"title":["Learning Discriminative Aggregation Network for Video-Based Face Recognition and Person Re-identification"],"prefix":"10.1007","volume":"127","author":[{"given":"Yongming","family":"Rao","sequence":"first","affiliation":[]},{"given":"Jiwen","family":"Lu","sequence":"additional","affiliation":[]},{"given":"Jie","family":"Zhou","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,11,28]]},"reference":[{"key":"1135_CR1","doi-asserted-by":"crossref","unstructured":"Baltieri, D., Vezzani, R., & Cucchiara, R. (2011). 3dpes: 3d people dataset for surveillance and forensics. In Proceedings of the 2011 joint ACM workshop on human gesture and behavior understanding, ACM, pp. 59\u201364.","DOI":"10.1145\/2072572.2072590"},{"key":"1135_CR2","doi-asserted-by":"crossref","unstructured":"Beveridge, J. R., Phillips, P. J., Bolme, D. S., Draper, B. A., Givens, G. H., Lui, Y. M., et al. (2013). The challenge of face recognition from digital point-and-shoot cameras. In 2013 IEEE sixth international conference on BTAS, pp. 1\u20138.","DOI":"10.1109\/BTAS.2013.6712704"},{"key":"1135_CR3","doi-asserted-by":"crossref","unstructured":"Cao, Q., Shen, L., Xie, W., Parkhi, O. M., & Zisserman, A. (2018). Vggface2: A dataset for recognising faces across pose and age. In 2018 13th IEEE international conference on automatic face and gesture recognition (FG 2018), IEEE, pp. 67\u201374.","DOI":"10.1109\/FG.2018.00020"},{"key":"1135_CR4","doi-asserted-by":"crossref","unstructured":"Cevikalp, H., & Triggs, B. (2010). Face recognition based on image sets. In 2010 IEEE conference on CVPR, pp. 2567\u20132573.","DOI":"10.1109\/CVPR.2010.5539965"},{"key":"1135_CR5","unstructured":"Chen, X., Duan, Y., Houthooft, R., Schulman, J,, Sutskever, I., & Abbeel, P. (2016b). Infogan: Interpretable representation learning by information maximizing generative adversarial nets. In NIPS, pp. 2172\u20132180."},{"key":"1135_CR6","doi-asserted-by":"crossref","unstructured":"Chen, J. C., Patel, V. M., & Chellappa, R. (2016a). Unconstrained face verification using deep CNN features. In 2016 IEEE winter conference on applications of computer vision (WACV), pp. 1\u20139.","DOI":"10.1109\/WACV.2016.7477557"},{"key":"1135_CR7","doi-asserted-by":"crossref","unstructured":"Chen, J. C., Ranjan, R., Kumar, A., Chen, C. H., Patel, V. M., & Chellappa, R. (2015). An end-to-end system for unconstrained face verification with deep convolutional neural networks. In Proceedings of the IEEE international conference on computer vision workshops, pp. 118\u2013126.","DOI":"10.1109\/ICCVW.2015.55"},{"key":"1135_CR8","unstructured":"Chen, Y. C., Patel, V. M., Phillips, P. J., & Chellappa, R. (2012). Dictionary-based face recognition from video, Springer, Berlin, pp. 766\u2013779 ."},{"key":"1135_CR9","unstructured":"Ding, C., & Tao, D. (2017). Trunk-branch ensemble convolutional neural networks for video-based face recognition. In PAMI."},{"key":"1135_CR10","doi-asserted-by":"crossref","unstructured":"Dong, C., Loy, C. C., He, K., & Tang, X. (2014). Learning a deep convolutional network for image super-resolution. In ECCV, Springer, pp. 184\u2013199.","DOI":"10.1007\/978-3-319-10593-2_13"},{"issue":"2","key":"1135_CR11","doi-asserted-by":"publisher","first-page":"295","DOI":"10.1109\/TPAMI.2015.2439281","volume":"38","author":"C Dong","year":"2016","unstructured":"Dong, C., Loy, C. C., He, K., & Tang, X. (2016). Image super-resolution using deep convolutional networks. T-PAMI, 38(2), 295\u2013307.","journal-title":"T-PAMI"},{"key":"1135_CR12","doi-asserted-by":"crossref","unstructured":"Felzenszwalb, P. F., Girshick, R. B., & McAllester, D. (2010). Cascade object detection with deformable part models. In 2010 IEEE conference on CVPR, IEEE, pp. 2241\u20132248.","DOI":"10.1109\/CVPR.2010.5539906"},{"key":"1135_CR13","unstructured":"Goodfellow, I., Pouget-Abadie, J., Mirza, M., Xu, B., Warde-Farley, D., Ozair, S., Courville, A., & Bengio, Y. (2014). Generative adversarial nets. In NIPS, pp. 2672\u20132680."},{"key":"1135_CR14","unstructured":"Gray, D., Brennan, S., & Tao, H. (2007). Evaluating appearance models for recognition, reacquisition, and tracking. In PETS, Citeseer, Vol. 3, pp. 1\u20137."},{"key":"1135_CR15","doi-asserted-by":"crossref","unstructured":"Guillaumin, M., Verbeek, J., & Schmid, C. (2009). Is that you? Metric learning approaches for face identification. In ICCV, pp. 498\u2013505.","DOI":"10.1109\/ICCV.2009.5459197"},{"key":"1135_CR16","doi-asserted-by":"crossref","unstructured":"Hassner, T., Masi, I., Kim, J., Choi, J., Harel, S., Natarajan, P., et al. (2016). Pooling faces: Template based face recognition with pooled face images. In CVPRW, pp. 59\u201367.","DOI":"10.1109\/CVPRW.2016.23"},{"issue":"4","key":"1135_CR17","doi-asserted-by":"publisher","first-page":"713","DOI":"10.1109\/TPAMI.2014.2353635","volume":"37","author":"M Hayat","year":"2015","unstructured":"Hayat, M., Bennamoun, M., & An, S. (2015). Deep reconstruction models for image set classification. PAMI, 37(4), 713\u2013727.","journal-title":"PAMI"},{"key":"1135_CR18","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., & Sun, J. (2015). Delving deep into rectifiers: Surpassing human-level performance on imagenet classification. In ICCV, pp. 1026\u20131034.","DOI":"10.1109\/ICCV.2015.123"},{"key":"1135_CR19","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., & Sun, J. (2016). Deep residual learning for image recognition. In CVPR, pp. 770\u2013778.","DOI":"10.1109\/CVPR.2016.90"},{"key":"1135_CR20","unstructured":"Hermans, A., Beyer, L., Leibe, B. (2017). In defense of the triplet loss for person re-identification. arXiv preprint \n                    arXiv:1703.07737\n                    \n                  ."},{"key":"1135_CR21","unstructured":"Hirzer, M., Beleznai, C., Roth, P. M., & Bischof, H. (2011). Person re-identification by descriptive and discriminative classification, Springer, Berlin, pp. 91\u2013102."},{"key":"1135_CR22","doi-asserted-by":"crossref","unstructured":"Hu, J., Lu, J., & Tan, Y. P. (2014a). Discriminative deep metric learning for face verification in the wild. In CVPR, pp. 1875\u20131882.","DOI":"10.1109\/CVPR.2014.242"},{"key":"1135_CR23","doi-asserted-by":"crossref","unstructured":"Hu, J., Lu, J., Yuan, J., & Tan, Y. P. (2014b). Large margin multi-metric learning for face and kinship verification in the wild. In ACCV, pp. 252\u2013267.","DOI":"10.1007\/978-3-319-16811-1_17"},{"key":"1135_CR24","doi-asserted-by":"crossref","unstructured":"Hu, Y., Mian, A. S., & Owens, R. (2011). Sparse approximated nearest points for image set classification. In Computer vision and pattern recognition, pp. 121\u2013128.","DOI":"10.1109\/CVPR.2011.5995500"},{"key":"1135_CR25","doi-asserted-by":"crossref","unstructured":"Hu, J., Shen, L., & Sun, G. (2018). Squeeze-and-excitation networks. IEEE Conference on Computer Vision and Pattern Recognition.","DOI":"10.1109\/CVPR.2018.00745"},{"key":"1135_CR26","unstructured":"Huang, Z., & Van\u00a0Gool, L. (2016). A riemannian network for SPD matrix learning. arXiv preprint \n                    arXiv:1608.04233\n                    \n                  ."},{"key":"1135_CR27","unstructured":"Huang, G. B., Ramesh, M., Berg, T., & Learned-Miller, E. (2007). Labeled faces in the wild: A database for studying face recognition in unconstrained environments. Technical report 07\u201349, University of Massachusetts, Amherst."},{"key":"1135_CR28","doi-asserted-by":"crossref","unstructured":"Huang, Z., Wang, R., Shan, S., & Chen, X. (2014). Learning euclidean-to-riemannian metric for point-to-set classification. In CVPR, pp. 1677\u20131684.","DOI":"10.1109\/CVPR.2014.217"},{"key":"1135_CR29","unstructured":"Huang, Z., Wang, R., Shan, S., Li, X., & Chen, X. (2015). Log-euclidean metric learning on symmetric positive definite manifold with application to image set classification. In ICML, pp. 720\u2013729."},{"key":"1135_CR30","unstructured":"Huang, Z., Wu, J., & Van\u00a0Gool, L. (2016). Building deep networks on grassmann manifolds. arXiv preprint \n                    arXiv:1611.05742\n                    \n                  ."},{"key":"1135_CR31","unstructured":"Ioffe, S., & Szegedy, C. (2015). Batch normalization: Accelerating deep network training by reducing internal covariate shift. arXiv preprint \n                    arXiv:1502.03167\n                    \n                  ."},{"key":"1135_CR32","doi-asserted-by":"crossref","unstructured":"Ionescu, C., Vantzos, O., & Sminchisescu, C. (2015). Matrix backpropagation for deep networks with structured layers. In ICCV, pp. 2965\u20132973.","DOI":"10.1109\/ICCV.2015.339"},{"key":"1135_CR33","unstructured":"Isola, P., Zhu, J. Y., Zhou, T., & Efros, A. A. (2016). Image-to-image translation with conditional adversarial networks. arXiv preprint \n                    arXiv:1611.07004\n                    \n                  ."},{"key":"1135_CR34","unstructured":"Jaderberg, M., Simonyan, K., Zisserman, A., et al. (2015). Spatial transformer networks. In NIPS, pp. 2017\u20132025."},{"key":"1135_CR35","doi-asserted-by":"crossref","unstructured":"Jia, Y., Shelhamer, E., Donahue, J., Karayev, S., Long, J., Girshick, R., et al. (2014). Caffe: Convolutional architecture for fast feature embedding. In ACM-MM, pp. 675\u2013678.","DOI":"10.1145\/2647868.2654889"},{"key":"1135_CR36","unstructured":"Kawanishi, Y., Wu, Y., Mukunoki, M., & Minoh, M. (2014). Shinpuhkan2014: A multi-camera pedestrian dataset for tracking people across multiple cameras. In 20th Korea-Japan joint workshop on frontiers of computer vision (Vol. 5, p. 6)."},{"key":"1135_CR37","unstructured":"Kim, M., Kumar, S., Pavlovic, V., & Rowley, H. (2008). Face tracking and recognition with visual constraints in real-world videos. In CVPR, pp. 1\u20138."},{"key":"1135_CR38","unstructured":"Kingma, D., & Ba, J. (2014). Adam: A method for stochastic optimization. arXiv preprint \n                    arXiv:1412.6980\n                    \n                  ."},{"key":"1135_CR39","unstructured":"Kingma, D. P., & Welling, M. (2013). Auto-encoding variational bayes. arXiv preprint \n                    arXiv:1312.6114\n                    \n                  ."},{"key":"1135_CR40","doi-asserted-by":"crossref","unstructured":"Klare, B. F., Klein, B., Taborsky, E., Blanton, A., Cheney, J., Allen, K., et al. (2015). Pushing the frontiers of unconstrained face detection and recognition: Iarpa janus benchmark a. In CVPR, pp. 1931\u20131939.","DOI":"10.1109\/CVPR.2015.7298803"},{"key":"1135_CR41","unstructured":"Larsen, A. B. L., S\u00f8nderby, S. K., Larochelle, H., & Winther, O. (2015). Autoencoding beyond pixels using a learned similarity metric. arXiv preprint \n                    arXiv:1512.09300\n                    \n                  ."},{"key":"1135_CR42","unstructured":"Ledig, C., Theis, L., Husz\u00e1r, F., Caballero, J., Cunningham, A., Acosta, A., Aitken, A., Tejani, A., Totz, J., Wang, Z., et\u00a0al. (2016). Photo-realistic single image super-resolution using a generative adversarial network. arXiv preprint \n                    arXiv:1609.04802\n                    \n                  ."},{"key":"1135_CR43","doi-asserted-by":"crossref","unstructured":"Li, W., & Wang, X. (2013). Locally aligned feature transforms across views. In CVPR, pp. 3594\u20133601.","DOI":"10.1109\/CVPR.2013.461"},{"key":"1135_CR44","doi-asserted-by":"crossref","unstructured":"Li, H., Hua, G., Shen, X., Lin, Z., & Brandt, J. (2014a). Eigen-pep for video face recognition. In ACCV, pp. 17\u201333.","DOI":"10.1007\/978-3-319-16811-1_2"},{"key":"1135_CR45","doi-asserted-by":"crossref","unstructured":"Li, W., Zhao, R., Xiao, T., & Wang, X. (2014b). Deepreid: Deep filter pairing neural network for person re-identification. In CVPR, pp. 152\u2013159.","DOI":"10.1109\/CVPR.2014.27"},{"key":"1135_CR46","doi-asserted-by":"crossref","unstructured":"Lin, J., Ren, L., Lu, J., Feng, J., & Zhou, J. (2017). Consistent-aware deep learning for person re-identification in a camera network. In CVPR, pp. 5771\u20135780.","DOI":"10.1109\/CVPR.2017.362"},{"key":"1135_CR47","doi-asserted-by":"crossref","unstructured":"Liu, Y., Yan, J., & Ouyang, W. (2017). Quality aware network for set to set recognition. In CVPR, Vol. 2, p. 8.","DOI":"10.1109\/CVPR.2017.499"},{"key":"1135_CR48","doi-asserted-by":"crossref","unstructured":"Lu, J., Wang, G., & Moulin, P. (2013). Image set classification using holistic multiple order statistics features and localized multi-kernel metric learning. In ICCV, pp. 329\u2013336.","DOI":"10.1109\/ICCV.2013.48"},{"key":"1135_CR49","doi-asserted-by":"crossref","unstructured":"Lu, J., Wang, G., Deng, W., Moulin, P., & Zhou, J. (2015). Multi-manifold deep metric learning for image set classification. In CVPR, pp. 1137\u20131145.","DOI":"10.1109\/CVPR.2015.7298717"},{"issue":"3","key":"1135_CR50","first-page":"529","volume":"26","author":"J Lu","year":"2016","unstructured":"Lu, J., Wang, G., & Moulin, P. (2016). Localized multifeature metric learning for image-set-based face recognition. TCSVT, 26(3), 529\u2013540.","journal-title":"TCSVT"},{"issue":"Nov","key":"1135_CR51","first-page":"2579","volume":"9","author":"M Lvd","year":"2008","unstructured":"Lvd, M., & Hinton, G. (2008). Visualizing data using t-sne. JMLR, 9(Nov), 2579\u20132605.","journal-title":"JMLR"},{"key":"1135_CR52","doi-asserted-by":"crossref","unstructured":"Parkhi, O. M., Vedaldi, A., & Zisserman, A. (2015). Deep face recognition. In BMVC, Vol. 1, p. 6.","DOI":"10.5244\/C.29.41"},{"key":"1135_CR53","unstructured":"Paszke, A., Gross, S., Chintala, S., & Chanan, G. (2017). Pytorch: Tensors and dynamic neural networks in python with strong GPU acceleration."},{"key":"1135_CR54","unstructured":"Radford, A., Metz, L., Chintala, S. (2015). Unsupervised representation learning with deep convolutional generative adversarial networks. arXiv preprint \n                    arXiv:1511.06434\n                    \n                  ."},{"key":"1135_CR55","doi-asserted-by":"crossref","unstructured":"Rao, Y., Lin, J., Lu, J., & Zhou, J. (2017). Learning discriminative aggregation network for video-based face recognition. In ICCV, pp. 3781\u20133790.","DOI":"10.1109\/ICCV.2017.408"},{"key":"1135_CR56","unstructured":"Reed, S., Akata, Z., Yan, X., Logeswaran, L., Schiele, B., & Lee, H. (2016). Generative adversarial text to image synthesis. In ICML, Vol. 3."},{"key":"1135_CR57","doi-asserted-by":"crossref","unstructured":"Schroff, F., Kalenichenko, D., & Philbin, J. (2015). Facenet: A unified embedding for face recognition and clustering. In CVPR, pp. 815\u2013823.","DOI":"10.1109\/CVPR.2015.7298682"},{"key":"1135_CR58","doi-asserted-by":"crossref","unstructured":"Shi, W., Caballero, J., Husz\u00e1r, F., Totz, J., Aitken, A. P., Bishop, R., et al. (2016). Real-time single image and video super-resolution using an efficient sub-pixel convolutional neural network. In CVPR, pp. 1874\u20131883.","DOI":"10.1109\/CVPR.2016.207"},{"key":"1135_CR59","doi-asserted-by":"crossref","unstructured":"Sohn, K., Liu, S., Zhong, G., Yu, X., Yang, M. H., & Chandraker, M. (2017). Unsupervised domain adaptation for face recognition in unlabeled videos. In CVPR, pp. 3210\u20133218.","DOI":"10.1109\/ICCV.2017.630"},{"key":"1135_CR60","doi-asserted-by":"crossref","unstructured":"Sun, Y., Wang, X., & Tang, X. (2015). Deeply learned face representations are sparse, selective, and robust. In CVPR, pp. 2892\u20132900.","DOI":"10.1109\/CVPR.2015.7298907"},{"key":"1135_CR61","doi-asserted-by":"crossref","unstructured":"Taigman, Y., Yang, M., Ranzato, M., & Wolf, L. (2014). Closing the gap to human-level performance in face verification. In CVPR, pp. 1701\u20131708.","DOI":"10.1109\/CVPR.2014.220"},{"key":"1135_CR62","unstructured":"Tesfaye, Y. T., Zemene, E., Prati, A., Pelillo, M., & Shah, M. (2017). Multi-target tracking in multiple non-overlapping cameras using constrained dominant sets. arXiv preprint \n                    arXiv:1706.06196\n                    \n                  ."},{"key":"1135_CR63","doi-asserted-by":"crossref","unstructured":"Tran, L., Yin, X., & Liu, X. (2017). Disentangled representation learning gan for pose-invariant face recognition. In CVPR, Vol. 3, p. 7.","DOI":"10.1109\/CVPR.2017.141"},{"key":"1135_CR64","doi-asserted-by":"crossref","unstructured":"Wang, R., & Chen, X. (2009). Manifold discriminant analysis. In CVPR, pp. 429\u2013436.","DOI":"10.1109\/CVPR.2009.5206850"},{"key":"1135_CR65","unstructured":"Wang, R., Guo, H., Davis, L. S., & Dai, Q. (2012). Covariance discriminative learning: A natural and efficient approach to image set classification. In CVPR, pp. 2496\u20132503."},{"issue":"12","key":"1135_CR66","doi-asserted-by":"publisher","first-page":"2368","DOI":"10.1109\/TCYB.2014.2307067","volume":"44","author":"J Wang","year":"2014","unstructured":"Wang, J., Lu, C., Wang, M., Li, P., Yan, S., & Hu, X. (2014). Robust face recognition via adaptive sparse representation. IEEE Transactions on Cybernetics, 44(12), 2368\u20132378.","journal-title":"IEEE Transactions on Cybernetics"},{"issue":"12","key":"1135_CR67","doi-asserted-by":"publisher","first-page":"2501","DOI":"10.1109\/TPAMI.2016.2522418","volume":"38","author":"T Wang","year":"2016","unstructured":"Wang, T., Gong, S., Zhu, X., & Wang, S. (2016). Person re-identification by discriminative selection in video ranking. IEEE Transactions on Pattern Analysis and Machine Intelligence, 38(12), 2501\u20132514.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"1135_CR68","doi-asserted-by":"crossref","unstructured":"Wen, Y., Zhang, K., Li, Z., & Qiao, Y. (2016). A discriminative feature learning approach for deep face recognition. In ECCV, pp. 499\u2013515.","DOI":"10.1007\/978-3-319-46478-7_31"},{"key":"1135_CR69","doi-asserted-by":"crossref","unstructured":"Whitelam, C., Taborsky, E., Blanton, A., Maze, B., Adams, J. C., Miller, T., et al. (2017). Iarpa janus benchmark-b face dataset. In Workshops on CVPR, pp. 592\u2013600.","DOI":"10.1109\/CVPRW.2017.87"},{"key":"1135_CR70","doi-asserted-by":"crossref","unstructured":"Wolf, L., Hassner, T., & Maoz, I. (2011). Face recognition in unconstrained videos with matched background similarity. In CVPR, pp. 529\u2013534.","DOI":"10.1109\/CVPR.2011.5995566"},{"issue":"2","key":"1135_CR71","doi-asserted-by":"publisher","first-page":"210","DOI":"10.1109\/TPAMI.2008.79","volume":"31","author":"J Wright","year":"2009","unstructured":"Wright, J., Yang, A. Y., Ganesh, A., Sastry, S. S., & Ma, Y. (2009). Robust face recognition via sparse representation. IEEE Transactions on Analysis and Machine Intelligence, 31(2), 210\u2013227.","journal-title":"IEEE Transactions on Analysis and Machine Intelligence"},{"key":"1135_CR72","doi-asserted-by":"crossref","unstructured":"Xiao, T., Li, H., Ouyang, W., & Wang, X. (2016). Learning deep feature representations with domain guided dropout for person re-identification. In CVPR, pp. 1249\u20131258.","DOI":"10.1109\/CVPR.2016.140"},{"key":"1135_CR73","doi-asserted-by":"crossref","unstructured":"Yang, J., Ren, P., Chen, D., Wen, F., Li, H., & Hua, G. (2016a). Neural aggregation network for video face recognition. arXiv preprint \n                    arXiv:1603.05474\n                    \n                  .","DOI":"10.1109\/CVPR.2017.554"},{"key":"1135_CR74","doi-asserted-by":"crossref","unstructured":"Yang, M., Wang, X., Liu, W., & Shen, L. (2016b). Joint regularized nearest points for image set based face recognition. In: IVC.","DOI":"10.1016\/j.imavis.2016.07.008"},{"key":"1135_CR75","doi-asserted-by":"crossref","unstructured":"Zhang, H., Xu, T., Li, H., Zhang, S., Huang, X., Wang, X., & Metaxas, D. (2016a). Stackgan: Text to photo-realistic image synthesis with stacked generative adversarial networks. arXiv preprint \n                    arXiv:1612.03242\n                    \n                  .","DOI":"10.1109\/ICCV.2017.629"},{"issue":"10","key":"1135_CR76","first-page":"1499","volume":"23","author":"K Zhang","year":"2016","unstructured":"Zhang, K., Zhang, Z., Li, Z., & Qiao, Y. (2016b). Joint face detection and alignment using multitask cascaded convolutional networks. SPL, 23(10), 1499\u20131503.","journal-title":"SPL"},{"key":"1135_CR77","unstructured":"Zhang, W., Hu, S., & Liu, K. (2017). Learning compact appearance representation for video-based person re-identification. arXiv preprint \n                    arXiv:1702.06294\n                    \n                  ."},{"key":"1135_CR78","doi-asserted-by":"crossref","unstructured":"Zheng, L., Bie, Z., Sun, Y., Wang, J., Su, C., Wang, S., et al. (2016). Mars: A video benchmark for large-scale person re-identification. In ECCV, Springer, pp. 868\u2013884.","DOI":"10.1007\/978-3-319-46466-4_52"},{"key":"1135_CR79","doi-asserted-by":"crossref","unstructured":"Zheng, L., Shen, L., Tian, L., Wang, S., Wang, J., & Tian, Q. (2015). Scalable person re-identification: A benchmark. In ICCV, pp. 1116\u20131124.","DOI":"10.1109\/ICCV.2015.133"},{"key":"1135_CR80","doi-asserted-by":"crossref","unstructured":"Zheng, W. S., Gong, S., & Xiang, T. (2009). Associating groups of people. In BMVC, Vol. 2.","DOI":"10.5244\/C.23.23"},{"key":"1135_CR81","unstructured":"Zhong, Z., Zheng, L., Cao, D., & Li, S. (2017). Re-ranking person re-identification with k-reciprocal encoding. arXiv preprint \n                    arXiv:1701.08398\n                    \n                  ."},{"key":"1135_CR82","unstructured":"Zhou, Z., Huang, Y., Wang, W., Wang, L., & Tan, T. (2017). In CVPR, IEEE, pp. 6776\u20136785."}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-018-1135-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s11263-018-1135-x\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-018-1135-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,11,27]],"date-time":"2019-11-27T19:07:20Z","timestamp":1574881640000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s11263-018-1135-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,11,28]]},"references-count":82,"journal-issue":{"issue":"6-7","published-print":{"date-parts":[[2019,6]]}},"alternative-id":["1135"],"URL":"https:\/\/doi.org\/10.1007\/s11263-018-1135-x","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"value":"0920-5691","type":"print"},{"value":"1573-1405","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018,11,28]]},"assertion":[{"value":"17 February 2018","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 November 2018","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 November 2018","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Compliance with Ethical Standards"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"This article does not contain any studies with human participants or animals.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical Approval"}}]}}