{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,4]],"date-time":"2025-11-04T10:42:07Z","timestamp":1762252927588,"version":"3.37.3"},"reference-count":65,"publisher":"Springer Science and Business Media LLC","issue":"6-7","license":[{"start":{"date-parts":[[2019,2,16]],"date-time":"2019-02-16T00:00:00Z","timestamp":1550275200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61876178","61806196"],"award-info":[{"award-number":["61876178","61806196"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"National Key Research and Development Plan","award":["2016YFC0801002"],"award-info":[{"award-number":["2016YFC0801002"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2019,6]]},"DOI":"10.1007\/s11263-019-01162-8","type":"journal-article","created":{"date-parts":[[2019,2,18]],"date-time":"2019-02-18T09:42:02Z","timestamp":1550482922000},"page":"684-700","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":43,"title":["Large-Scale Bisample Learning on ID Versus Spot Face Recognition"],"prefix":"10.1007","volume":"127","author":[{"given":"Xiangyu","family":"Zhu","sequence":"first","affiliation":[]},{"given":"Hao","family":"Liu","sequence":"additional","affiliation":[]},{"given":"Zhen","family":"Lei","sequence":"additional","affiliation":[]},{"given":"Hailin","family":"Shi","sequence":"additional","affiliation":[]},{"given":"Fan","family":"Yang","sequence":"additional","affiliation":[]},{"given":"Dong","family":"Yi","sequence":"additional","affiliation":[]},{"given":"Guojun","family":"Qi","sequence":"additional","affiliation":[]},{"given":"Stan Z.","family":"Li","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2019,2,16]]},"reference":[{"key":"1162_CR1","doi-asserted-by":"crossref","unstructured":"Babbar, R., Sch\u00f6lkopf, B. (2017). Dismec: Distributed sparse machines for extreme multi-label classification. In Proceedings of the tenth ACM international conference on web search and data mining (pp. 721\u2013729). ACM.","DOI":"10.1145\/3018661.3018741"},{"key":"1162_CR2","doi-asserted-by":"crossref","unstructured":"Balntas, V., Riba, E., Ponsa, D., & Mikolajczyk, K. (2016). Learning local feature descriptors with triplets and shallow convolutional neural networks. In British machine vision conference (pp. 119.1\u2013119.11).","DOI":"10.5244\/C.30.119"},{"key":"1162_CR3","first-page":"1137","volume":"3","author":"Y Bengio","year":"2003","unstructured":"Bengio, Y., Ducharme, R., Vincent, P., & Jauvin, C. (2003). A neural probabilistic language model. Journal of Machine Learning Research, 3, 1137\u20131155.","journal-title":"Journal of Machine Learning Research"},{"key":"1162_CR4","unstructured":"Bertinetto, L., Henriques, J. F., Valmadre, J., Torr, P. H. S., & Vedaldi, A. (2016). Learning feed-forward one-shot learners. In Neural information processing systems (pp. 523\u2013531)."},{"key":"1162_CR5","unstructured":"Bhatia, K., Jain, H., Kar, P., Varma, M., & Jain, P. (2015). Sparse local embeddings for extreme multi-label classification. In Advances in neural information processing systems (pp. 730\u2013738)."},{"key":"1162_CR6","unstructured":"Cao, Q., Shen, L., Xie, W., Parkhi, O. M., & Zisserman, A. (2017). Vggface2: A dataset for recognising faces across pose and age. arXiv preprint arXiv:1710.08092 ."},{"key":"1162_CR7","doi-asserted-by":"crossref","unstructured":"Chen, W., Chen, X., Zhang, J., & Huang, K. (2017). Beyond triplet loss: A deep quadruplet network for person re-identification. In The conference on computer vision and pattern recognition (pp. 1320\u20131329).","DOI":"10.1109\/CVPR.2017.145"},{"key":"1162_CR8","doi-asserted-by":"crossref","unstructured":"Choe, J., Park, S., Kim, K., Hyun Park, J., Kim, D., & Shim, H. (2017). Face generation for low-shot learning using generative adversarial networks. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 1940\u20131948).","DOI":"10.1109\/ICCVW.2017.229"},{"key":"1162_CR9","unstructured":"Choromanska, A., Agarwal, A., & Langford, J. (2013). Extreme multi class classification. In NIPS Workshop: eXtreme Classification (submitted)."},{"issue":"4","key":"1162_CR10","doi-asserted-by":"publisher","first-page":"594","DOI":"10.1109\/TPAMI.2006.79","volume":"28","author":"L Feifei","year":"2006","unstructured":"Feifei, L., Fergus, R., & Perona, P. (2006). One-shot learning of object categories. IEEE Transactions on Pattern Analysis and Machine Intelligence, 28(4), 594\u2013611.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"1162_CR11","unstructured":"Feng, Z. -H., Kittler, J., Awais, M., Huber, P., & Wu, X. J. (2017). Wing loss for robust facial landmark localisation with convolutional neural networks. arXiv preprint arXiv:1711.06753 ."},{"key":"1162_CR12","unstructured":"Guo, Y., & Zhang, L. (2017). One-shot face recognition by promoting underrepresented classes. arXiv preprint arXiv:1707.05574 ."},{"key":"1162_CR13","doi-asserted-by":"crossref","unstructured":"Guo, Y., Zhang, L., Hu, Y., He, X., & Gao, J. J. (2016). Ms-celeb-1m: A dataset and benchmark for large-scale face recognition. In European conference on computer vision (pp. 87\u2013102). Springer.","DOI":"10.1007\/978-3-319-46487-9_6"},{"key":"1162_CR14","unstructured":"Gutmann, M., & Hyv\u00e4rinen, A. (2010). Noise-contrastive estimation: A new estimation principle for unnormalized statistical models. InProceedings of the thirteenth international conference on artificial intelligence and statistics (pp. 297\u2013304)."},{"key":"1162_CR15","unstructured":"Hariharan, B., & Girshick, R. (2016). Low-shot visual recognition by shrinking and hallucinating features. arXiv preprint arXiv:1606.02819 ."},{"key":"1162_CR16","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., & Sun, J. (2016). Deep residual learning for image recognition. In Computer Vision and Pattern Recognition (pp. 770\u2013778).","DOI":"10.1109\/CVPR.2016.90"},{"key":"1162_CR17","unstructured":"Hsu, D. J., Kakade, S. M., Langford, J., & Zhang, T. (2009). Multi-label prediction via compressed sensing. In Advances in neural information processing systems (pp. 772\u2013780)."},{"key":"1162_CR18","unstructured":"Huang, C., Loy, C. C., & Tang, X. (2016). Local similarity-aware deep feature embedding. In Advances in neural information processing systems (pp. 1262\u20131270)."},{"key":"1162_CR19","unstructured":"Huang, G. B., Mattar, M., Berg, T., & Learned-Miller, E. (2008). E: Labeled faces in the wild: A database for studying face recognition in unconstrained environments. In Workshop on faces in\u2018Real-Life\u2019 Images: detection, alignment, and recognition"},{"key":"1162_CR20","unstructured":"Koch, G., Zemel, R., & Salakhutdinov, R. (2015). Siamese neural networks for one-shot image recognition. In ICML deep learning workshop (Vol. 2)."},{"key":"1162_CR21","unstructured":"Krizhevsky, A., Sutskever, I., & Hinton, G. E. (2012). Imagenet classification with deep convolutional neural networks. In International conference on neural information processing systems (pp. 1097\u20131105)."},{"key":"1162_CR22","unstructured":"Kumar, V. B., Harwood, B., Carneiro, G., Reid, I., & Drummond, T. (2017). Smart mining for deep metric learning. arXiv preprint arXiv:1704.01285 ."},{"key":"1162_CR23","doi-asserted-by":"crossref","unstructured":"Liao, S., Lei, Z., Yi, D., & Li, S. Z. (2014). A benchmark study of large-scale unconstrained face recognition. In IEEE international joint conference on biometrics (pp. 1\u20138).","DOI":"10.1109\/BTAS.2014.6996301"},{"key":"1162_CR24","doi-asserted-by":"crossref","unstructured":"Liu, W., Wen, Y., Yu, Z., Li, M., Raj, B., & Song, L. (2017a). Sphereface: Deep hypersphere embedding for face recognition. In Proceedings of the IEEE conference on computer vision and pattern recognition.","DOI":"10.1109\/CVPR.2017.713"},{"key":"1162_CR25","unstructured":"Liu, W., Wen, Y., Yu, Z., & Yang, M. (2016). Large-margin softmax loss for convolutional neural networks. In ICML (pp. 507\u2013516)."},{"key":"1162_CR26","unstructured":"Liu, W., Zhang, Y. M., Li, X., Yu, Z., Dai, B., Zhao, T., & Song, L. (2017b). Deep hyperspherical learning. In Advances in neural information processing systems (pp. 3953\u20133963)."},{"key":"1162_CR27","unstructured":"Mnih, A., & Kavukcuoglu, K. (2013). Learning word embeddings efficiently with noise-contrastive estimation. In Advances in neural information processing systems (pp. 2265\u20132273)."},{"key":"1162_CR28","unstructured":"Mnih, A., & Teh, Y. W. (2012). A fast and simple algorithm for training neural probabilistic language models. arXiv preprint arXiv:1206.6426 ."},{"key":"1162_CR29","unstructured":"Nech, A., & Kemelmacher-Shlizerman, I. (2017). Level playing field for million scale face recognition. arXiv preprint arXiv:1705.00393 ."},{"key":"1162_CR30","doi-asserted-by":"crossref","unstructured":"Oh Song, H. Xiang, Y., Jegelka, S., & Savarese, S. (2016) Deep metric learning via lifted structured feature embedding. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 4004\u20134012).","DOI":"10.1109\/CVPR.2016.434"},{"key":"1162_CR31","doi-asserted-by":"crossref","unstructured":"Ouyang, W., Wang, X., Zhang, C., & Yang, X. (2016). Factors in finetuning deep model for object detection with long-tail distribution. In Computer vision and pattern recognition (pp. 864\u2013873).","DOI":"10.1109\/CVPR.2016.100"},{"issue":"3","key":"1162_CR32","first-page":"6","volume":"1","author":"OM Parkhi","year":"2015","unstructured":"Parkhi, O. M., Vedaldi, A., Zisserman, A., et al. (2015). Deep face recognition. BMVC, 1(3), 6.","journal-title":"BMVC"},{"key":"1162_CR33","doi-asserted-by":"crossref","unstructured":"Prabhu, Y., & Varma, M. (2014). Fastxml: A fast, accurate and stable tree-classifier for extreme multi-label learning. In Proceedings of the 20th ACM SIGKDD international conference on Knowledge discovery and data mining (pp. 263\u2013272). ACM.","DOI":"10.1145\/2623330.2623651"},{"key":"1162_CR34","unstructured":"Ranjan, R., Castillo, C. D., & Chellappa, R. (2017). L2-constrained softmax loss for discriminative face verification. arXiv preprint arXiv:1703.09507 ."},{"key":"1162_CR35","unstructured":"Santoro, A., Bartunov, S., Botvinick, M., Wierstra, D., & Lillicrap, T. P. (2016). One-shot learning with memory-augmented neural networks. arXiv:1605.06065"},{"key":"1162_CR36","doi-asserted-by":"crossref","unstructured":"Schroff, F., Kalenichenko, D., & Philbin, J. (2015) Facenet: A unified embedding for face recognition and clustering. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 815\u2013823).","DOI":"10.1109\/CVPR.2015.7298682"},{"key":"1162_CR37","unstructured":"Simonyan, K., & Zisserman, A. (2014). Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556 ."},{"key":"1162_CR38","doi-asserted-by":"crossref","unstructured":"Smirnov, E., Melnikov, A., Novoselov, S., Luckyanets, E., & Lavrentyeva, G. (2017). Doppelganger mining for face representation learning. In International conference on computer vision","DOI":"10.1109\/ICCVW.2017.226"},{"key":"1162_CR39","unstructured":"Sohn, K. (2016). Improved deep metric learning with multi-class n-pair loss objective. In Advances in neural information processing systems (pp. 1857\u20131865)."},{"key":"1162_CR40","doi-asserted-by":"crossref","unstructured":"Sun, C., Shrivastava, A., Singh, S. & Gupta, A. (2017). Revisiting unreasonable effectiveness of data in deep learning era. In 2017 IEEE international conference on computer vision (ICCV) (pp. 843\u2013852). IEEE.","DOI":"10.1109\/ICCV.2017.97"},{"key":"1162_CR41","unstructured":"Sun, Y., Chen, Y., Wang, X., & Tang, X. (2014). Deep learning face representation by joint identification-verification. In Advances in neural information processing systems (pp. 1988\u20131996)."},{"key":"1162_CR42","unstructured":"Sun, Y., Wang, X., & Tang, X. (2013). Deep learning face representation from predicting 10,000 classes. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 1891\u20131898)."},{"key":"1162_CR43","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Liu, W., Jia, Y., Sermanet, P., Reed, S., Anguelov, D., Erhan, D., Vanhoucke, D. V., & Rabinovich, A. (2015). Going deeper with convolutions. In The IEEE conference on computer vision and pattern recognition (CVPR).","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"1162_CR44","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Vanhoucke, V., Ioffe, S., Shlens, J., & Wojna, Z. (2016). Rethinking the inception architecture for computer vision. In Computer Vision and Pattern Recognition (pp. 2818\u20132826).","DOI":"10.1109\/CVPR.2016.308"},{"key":"1162_CR45","doi-asserted-by":"crossref","unstructured":"Tagami, Y. (2017). Annexml: Approximate nearest neighbor search for extreme multi-label classification. In Proceedings of the 23rd ACM SIGKDD international conference on knowledge discovery and data mining (pp. 455\u2013464). ACM.","DOI":"10.1145\/3097983.3097987"},{"key":"1162_CR46","doi-asserted-by":"crossref","unstructured":"Taigman, Y., Yang, M., Ranzato, M., & Wolf, L. (2013) Deepface: Closing the gap to human-level performance in face verification. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 1701\u20131708).","DOI":"10.1109\/CVPR.2014.220"},{"key":"1162_CR47","unstructured":"Taigman, Y., Yang, M., Ranzato, M., & Wolf, L. (2014). Web-scale training for face identification. arXiv preprint arXiv:1406.5266 ."},{"key":"1162_CR48","unstructured":"Vaswani, A., Zhao, Y., Fossum, V., & Chiang, D. (2013). Decoding with large-scale neural language models improves translation. In Proceedings of the 2013 conference on empirical methods in natural language processing (pp. 1387\u20131392)."},{"key":"1162_CR49","unstructured":"Vinyals, O., Blundell, C., Lillicrap, T. P., Kavukcuoglu, K., & Wierstra, D. (2016). Matching networks for one shot learning. In Neural information processing systems (pp. 3630\u20133638)."},{"key":"1162_CR50","unstructured":"Wang, C., Zhang, X., & Lan, X. (2017). How to train triplet networks with 100k identities? arXiv preprint arXiv:1709.02940 ."},{"key":"1162_CR51","doi-asserted-by":"publisher","first-page":"926","DOI":"10.1109\/LSP.2018.2822810","volume":"25","author":"F Wang","year":"2018","unstructured":"Wang, F., Liu, W., Liu, H., & Cheng, J. (2018a). Additive margin softmax for face verification. IEEE Signal Processing Letters, 25, 926\u2013930.","journal-title":"IEEE Signal Processing Letters"},{"key":"1162_CR52","doi-asserted-by":"crossref","unstructured":"Wang, F., Xiang, X., Cheng, J., & Yuille, A. L. (2017). Normface: $$ l\\_2 $$ l _ 2 hypersphere embedding for face verification. arXiv preprint arXiv:1704.06369","DOI":"10.1145\/3123266.3123359"},{"key":"1162_CR53","doi-asserted-by":"crossref","unstructured":"Wang, H., Wang, Y., Zhou, Z., Ji, X., & Liu, W. (2018b). Cosface: Large margin cosine loss for deep face recognition. In 2018 IEEE conference on computer vision and pattern recognition (CVPR). IEEE.","DOI":"10.1109\/CVPR.2018.00552"},{"key":"1162_CR54","volume-title":"Learning to learn: model regression networks for easy small sample learning","author":"YX Wang","year":"2016","unstructured":"Wang, Y. X., & Hebert, M. (2016). Learning to learn: model regression networks for easy small sample learning. Berlin: Springer."},{"key":"1162_CR55","doi-asserted-by":"crossref","unstructured":"Wen, Y., Zhang, K., Li, Z., & Qiao, Y. (2016). A discriminative feature learning approach for deep face recognition. In European conference on computer vision (pp. 499\u2013515). Springer.","DOI":"10.1007\/978-3-319-46478-7_31"},{"key":"1162_CR56","unstructured":"Weston, J., Chopra, S., & Bordes, A. (2014). Memory networks. arXiv preprint arXiv:1410.3916 ."},{"key":"1162_CR57","unstructured":"Wu, X., He, R., Sun, Z., & Tan, T. (2015). A light CNN for deep face representation with noisy labels. arXiv preprint arXiv:1511.02683 ."},{"key":"1162_CR58","doi-asserted-by":"crossref","unstructured":"Xu, C., Tao, D., & Xu, C. (2016). Robust extreme multi-label learning. In Proceedings of the 22nd ACM SIGKDD international conference on knowledge discovery and data mining (pp. 1275\u20131284). ACM.","DOI":"10.1145\/2939672.2939798"},{"key":"1162_CR59","unstructured":"Xu, Z., Zhu, L., & Yang, Y. (2016). Few-shot object recognition from machine-labeled web images. arXiv preprint arXiv:1612.06152 ."},{"key":"1162_CR60","doi-asserted-by":"crossref","unstructured":"Yang, J., Price, B., Cohen, S., & Yang, M. H. (2014). Context driven scene parsing with attention to rare classes. In IEEE conference on computer vision and pattern recognition (pp. 3294\u20133301).","DOI":"10.1109\/CVPR.2014.415"},{"key":"1162_CR61","unstructured":"Yi, D., Lei, Z., Liao, S., & Li, S. Z. (2014). Learning face representation from scratch. In Computer vision and pattern recognition"},{"key":"1162_CR62","unstructured":"Zhang, S., Zhu, X., Lei, Z., Shi, H., Wang, X., & Li, S. Z. (2017). Faceboxes: a CPU real-time face detector with high accuracy. arXiv preprint arXiv:1708.05234 ."},{"key":"1162_CR63","doi-asserted-by":"crossref","unstructured":"Zhang, X., Fang, Z., Wen, Y., Li, Z., & Qiao, Y. (2017). Range loss for deep face recognition with long-tailed training data. In The IEEE international conference on computer vision (ICCV).","DOI":"10.1109\/ICCV.2017.578"},{"key":"1162_CR64","unstructured":"Zhao, Y., Jin, Z., Qi, G., Lu, H., & Hua, X. (2018). A principled approach to hard triplet generation via adversarial nets. In European conference on computer vision."},{"key":"1162_CR65","unstructured":"Zhou, E., Cao, Z., & Yin, Q. (2015). Naive-deep face recognition: Touching the limit of LFW benchmark or not? arXiv preprint arXiv:1501.04690 ."}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s11263-019-01162-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-019-01162-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-019-01162-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,9,12]],"date-time":"2022-09-12T01:00:08Z","timestamp":1662944408000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s11263-019-01162-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,2,16]]},"references-count":65,"journal-issue":{"issue":"6-7","published-print":{"date-parts":[[2019,6]]}},"alternative-id":["1162"],"URL":"https:\/\/doi.org\/10.1007\/s11263-019-01162-8","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"type":"print","value":"0920-5691"},{"type":"electronic","value":"1573-1405"}],"subject":[],"published":{"date-parts":[[2019,2,16]]},"assertion":[{"value":"16 February 2018","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"1 February 2019","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 February 2019","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}