{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,21]],"date-time":"2026-05-21T12:31:06Z","timestamp":1779366666798,"version":"3.53.0"},"reference-count":42,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2022,9,10]],"date-time":"2022-09-10T00:00:00Z","timestamp":1662768000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,9,10]],"date-time":"2022-09-10T00:00:00Z","timestamp":1662768000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100001659","name":"Deutsche Forschungsgemeinschaft","doi-asserted-by":"crossref","award":["388420599"],"award-info":[{"award-number":["388420599"]}],"id":[{"id":"10.13039\/501100001659","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Digit Libr"],"published-print":{"date-parts":[[2022,12]]},"DOI":"10.1007\/s00799-022-00337-y","type":"journal-article","created":{"date-parts":[[2022,9,10]],"date-time":"2022-09-10T13:02:36Z","timestamp":1662814956000},"page":"319-333","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["VIVA: visual information retrieval in video archives"],"prefix":"10.1007","volume":"23","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7391-264X","authenticated-orcid":false,"given":"Markus","family":"M\u00fchling","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Nikolaus","family":"Korfhage","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Kader","family":"Pustu-Iren","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Joanna","family":"Bars","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Mario","family":"Knapp","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Hicham","family":"Bellafkir","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Markus","family":"Vogelbacher","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Daniel","family":"Schneider","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Angelika","family":"H\u00f6rth","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Ralph","family":"Ewerth","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Bernd","family":"Freisleben","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2022,9,10]]},"reference":[{"issue":"5","key":"337_CR1","doi-asserted-by":"publisher","first-page":"76","DOI":"10.3390\/jimaging7050076","volume":"7","author":"G Amato","year":"2021","unstructured":"Amato, G., Bolettieri, P., Carrara, F., Debole, F., Falchi, F., Gennaro, C., Vadicamo, L., Vairo, C.: The VISIONE video search system: exploiting off-the-shelf text search engines for large-scale video retrieval. J. Imaging 7(5), 76 (2021). https:\/\/doi.org\/10.3390\/jimaging7050076","journal-title":"J. Imaging"},{"key":"337_CR2","doi-asserted-by":"crossref","unstructured":"Amato, G., Falchi, F., Gennaro, C., Rabitti, F.: Searching and annotating 100m images with yfcc100m-hnfc6 and mi-file. In: Proceedings of the 15th International Workshop on Content-Based Multimedia Indexing. pp. 1\u20134 (2017)","DOI":"10.1145\/3095713.3095740"},{"key":"337_CR3","doi-asserted-by":"publisher","unstructured":"Andreadis, S., Moumtzidou, A., Gkountakos, K., Pantelidis, N., Apostolidis, K., Galanopoulos, D., Gialampoukidis, I., Vrochidis, S., Mezaris, V., Kompatsiaris, I.: VERGE in VBS 2021. In: Proceedings of the 27th International Conference on MultiMedia Modeling (MMM 2021). Lecture Notes in Computer Science, vol. 12573, pp. 398\u2013404. Springer (2021) https:\/\/doi.org\/10.1007\/978-3-030-67835-7_35","DOI":"10.1007\/978-3-030-67835-7_35"},{"key":"337_CR4","doi-asserted-by":"crossref","unstructured":"Cao, Q., Shen, L., Xie, W., Parkhi, O.M., Zisserman, A.: Vggface2: a dataset for recognising faces across pose and age. In: Proceedings of the 13th IEEE International Conference on Automatic Face and Gesture Recognition (FG 2018). pp. 67\u201374. IEEE (2018)","DOI":"10.1109\/FG.2018.00020"},{"key":"337_CR5","doi-asserted-by":"crossref","unstructured":"Deng, J., Dong, W., Socher, R., Li, L.J., Li, K., Fei-Fei, L.: Imagenet: a large-scale hierarchical image database. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. pp. 248\u2013255. IEEE (2009)","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"337_CR6","doi-asserted-by":"crossref","unstructured":"Deng, J., Guo, J., Xue, N., Zafeiriou, S.: ArcFace: additive angular margin loss for deep face recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 4690\u20134699. IEEE (2019)","DOI":"10.1109\/CVPR.2019.00482"},{"key":"337_CR7","doi-asserted-by":"crossref","unstructured":"Deng, J., Guo, J., Zhou, Y., Yu, J., Kotsia, I., Zafeiriou, S.: Retinaface: single-stage dense face localisation in the wild. arXiv preprint arXiv:1905.00641 (2019)","DOI":"10.1109\/CVPR42600.2020.00525"},{"issue":"1","key":"337_CR8","first-page":"1","volume":"20","author":"T Elsken","year":"2019","unstructured":"Elsken, T., Metzen, J.H., Hutter, F.: Neural architecture search: a survey. J. Mach. Learn. Res. 20(1), 1\u201321 (2019)","journal-title":"J. Mach. Learn. Res."},{"key":"337_CR9","doi-asserted-by":"publisher","unstructured":"Gasser, R., Rossetto, L., Schuldt, H.: Multimodal multimedia retrieval with vitrivr. In: Proceedings of the International Conference on Multimedia Retrieval (ICMR 2019). pp. 391\u2013394. ACM (2019). https:\/\/doi.org\/10.1145\/3323873.3326921","DOI":"10.1145\/3323873.3326921"},{"key":"337_CR10","doi-asserted-by":"crossref","unstructured":"Guo, Y., Zhang, L., Hu, Y., He, X., Gao, J.: MS-Celeb-1M: a dataset and benchmark for large-scale face recognition. In: Proceedings of 14th European Conference on Computer Vision. pp. 87\u2013102. Lecture Notes in Computer Science, Springer (2016)","DOI":"10.1007\/978-3-319-46487-9_6"},{"key":"337_CR11","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Delving deep into rectifiers: Surpassing human-level performance on imagenet classification. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1026\u20131034 (2015)","DOI":"10.1109\/ICCV.2015.123"},{"key":"337_CR12","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"337_CR13","doi-asserted-by":"publisher","unstructured":"Hu, B., Song, R., Wei, X., Yao, Y., Hua, X., Liu, Y.: PyRetri: A pytorch-based library for unsupervised image retrieval by deep convolutional neural networks. In: Proceedings of the 28th ACM International Conference on Multimedia. pp. 4461\u20134464. ACM (2020). https:\/\/doi.org\/10.1145\/3394171.3414537","DOI":"10.1145\/3394171.3414537"},{"issue":"1","key":"337_CR14","doi-asserted-by":"publisher","first-page":"117","DOI":"10.1109\/TPAMI.2010.57","volume":"33","author":"H Jegou","year":"2010","unstructured":"Jegou, H., Douze, M., Schmid, C.: Product quantization for nearest neighbor search. IEEE Trans. Pattern Anal. Mach. Intell. 33(1), 117\u2013128 (2010)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"3","key":"337_CR15","doi-asserted-by":"publisher","first-page":"535","DOI":"10.1109\/TBDATA.2019.2921572","volume":"7","author":"J Johnson","year":"2019","unstructured":"Johnson, J., Douze, M., J\u00e9gou, H.: Billion-scale similarity search with GPUs. IEEE Trans. Big Data 7(3), 535\u2013547 (2019)","journal-title":"IEEE Trans. Big Data"},{"issue":"2","key":"337_CR16","doi-asserted-by":"publisher","first-page":"291","DOI":"10.1002\/j.1538-7305.1970.tb01770.x","volume":"49","author":"BW Kernighan","year":"1970","unstructured":"Kernighan, B.W., Lin, S.: An efficient heuristic procedure for partitioning graphs. Bell Syst. Tech. J. 49(2), 291\u2013307 (1970)","journal-title":"Bell Syst. Tech. J."},{"key":"337_CR17","first-page":"1755","volume":"10","author":"DE King","year":"2009","unstructured":"King, D.E.: Dlib-ml: a machine learning toolkit. J. Mach. Learn. Res. 10, 1755\u20131758 (2009)","journal-title":"J. Mach. Learn. Res."},{"key":"337_CR18","unstructured":"Kingma, D.P., Ba, J.: Adam: A method for stochastic optimization. In: Proceedings of the 3rd International Conference on Learning Representations (ICLR) (2015)"},{"key":"337_CR19","doi-asserted-by":"crossref","unstructured":"Korfhage, N., M\u00fchling, M., Freisleben, B.: Intentional image similarity search. In: IAPR Workshop on Artificial Neural Networks in Pattern Recognition, pp. 23\u201335. Springer (2020)","DOI":"10.1007\/978-3-030-58309-5_2"},{"key":"337_CR20","doi-asserted-by":"crossref","unstructured":"Korfhage, N., M\u00fchling, M., Freisleben, B.: ElasticHash: semantic image similarity search by deep hashing with elasticsearch. In: Proceedings of the International Conference on Computer Analysis of Images and Patterns (CAIP). pp 14\u201323. Springer (2021)","DOI":"10.1007\/978-3-030-89131-2_2"},{"key":"337_CR21","doi-asserted-by":"publisher","unstructured":"Kratochv\u00edl, M., Mejzl\u00edk, F., Vesel\u00fd, P., Soucek, T., Lokoc, J.: SOMHunter: Lightweight video search system with SOM-guided relevance feedback. In: Proceedings of the 28th International Conference on Multimedia (MM). pp. 4481\u20134484. ACM (2020), https:\/\/doi.org\/10.1145\/3394171.3414542","DOI":"10.1145\/3394171.3414542"},{"issue":"7","key":"337_CR22","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s11263-020-01316-z","volume":"128","author":"A Kuznetsova","year":"2020","unstructured":"Kuznetsova, A., Rom, H., Alldrin, N., Uijlings, J., Krasin, I., Pont-Tuset, J., Kamali, S., Popov, S., Malloci, M., Kolesnikov, A., et al.: The open images dataset v4. Int. J. Comput. Vis. 128(7), 1\u201326 (2020)","journal-title":"Int. J. Comput. Vis."},{"key":"337_CR23","doi-asserted-by":"crossref","unstructured":"Lin, T.Y., Goyal, P., Girshick, R., He, K., Dollar, P.: Focal loss for dense object detection. In: Proceedings of the IEEE International Conference on Computer Vision (ICCV), pp. 2980\u20132988 (2017)","DOI":"10.1109\/ICCV.2017.324"},{"key":"337_CR24","doi-asserted-by":"crossref","unstructured":"Liu, C., Zoph, B., Neumann, M., Shlens, J., Hua, W., Li, L.J., Fei-Fei, L., Yuille, A., Huang, J., Murphy, K.: Progressive neural architecture search. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 19\u201334 (2018)","DOI":"10.1007\/978-3-030-01246-5_2"},{"key":"337_CR25","doi-asserted-by":"publisher","unstructured":"Lokoc, J., Schoeffmann, K., Bailer, W., Rossetto, L., Gurrin, C.: Interactive video retrieval in the age of deep learning. In: Proceedings of the International Conference on Multimedia Retrieval (ICMR), pp 2\u20134. ACM (2019). https:\/\/doi.org\/10.1145\/3323873.3326588","DOI":"10.1145\/3323873.3326588"},{"key":"337_CR26","unstructured":"M\u00fchling, M., Ewerth, R., Stadelmann, T., Z\u00f6fel, C., Shi, B., Freisleben, B.: University of Marburg at TRECVID 2007: shot boundary detection and high level feature extraction. In: TRECVID (2007)"},{"issue":"2","key":"337_CR27","doi-asserted-by":"publisher","first-page":"167","DOI":"10.1007\/s00799-018-0236-z","volume":"20","author":"M M\u00fchling","year":"2019","unstructured":"M\u00fchling, M., Meister, M., Korfhage, N., Wehling, J., H\u00f6rth, A., Ewerth, R., Freisleben, B.: Content-based video retrieval in historical collections of the German broadcasting archive. Int. J. Digit. Libr. 20(2), 167\u2013183 (2019)","journal-title":"Int. J. Digit. Libr."},{"key":"337_CR28","doi-asserted-by":"publisher","unstructured":"Nguyen, P.A., Wu, J., Ngo, C., Francis, D., Huet, B.: VIREO@ video browser showdown 2020. In: Proceedings of the 26th International Conference on MultiMedia Modeling (MMM). Lecture Notes in Computer Science, vol. 11962, pp. 772\u2013777. Springer (2020). https:\/\/doi.org\/10.1007\/978-3-030-37734-2_68","DOI":"10.1007\/978-3-030-37734-2_68"},{"key":"337_CR29","doi-asserted-by":"crossref","unstructured":"Norouzi, M., Punjani, A., Fleet, D.J.: Fast search in Hamming space with multi-index hashing. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR). pp. 3108\u20133115. IEEE (2012)","DOI":"10.1109\/CVPR.2012.6248043"},{"key":"337_CR30","doi-asserted-by":"crossref","unstructured":"Pustu-Iren, K., M\u00fchling, M., Korfhage, N., Bars, J., Bernh\u00f6ft, S., H\u00f6rth, A., Freisleben, B., Ewerth, R.: Investigating correlations of inter-coder agreement and machine annotation performance for historical video data. In: Proceedings of the International Conference on Theory and Practice of Digital Libraries, pp. 107\u2013114 (2019)","DOI":"10.1007\/978-3-030-30760-8_9"},{"issue":"7","key":"337_CR31","doi-asserted-by":"publisher","first-page":"5261","DOI":"10.1007\/s10462-020-09820-x","volume":"53","author":"J Rodrigues","year":"2020","unstructured":"Rodrigues, J., Cristo, M., Colonna, J.G.: Deep hashing for multi-label image retrieval: a survey. Artif. Intell. Rev. 53(7), 5261\u20135307 (2020)","journal-title":"Artif. Intell. Rev."},{"issue":"1\u20133","key":"337_CR32","doi-asserted-by":"publisher","first-page":"157","DOI":"10.1007\/s11263-007-0090-8","volume":"77","author":"BC Russell","year":"2008","unstructured":"Russell, B.C., Torralba, A., Murphy, K.P., Freeman, W.T.: LabelMe: a database and web-based tool for image annotation. Int. J. Comput. Vis. 77(1\u20133), 157\u2013173 (2008)","journal-title":"Int. J. Comput. Vis."},{"key":"337_CR33","doi-asserted-by":"crossref","unstructured":"Schroff, F., Kalenichenko, D., Philbin, J.: Facenet: A unified embedding for face recognition and clustering. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 815\u2013823 (2015)","DOI":"10.1109\/CVPR.2015.7298682"},{"issue":"12","key":"337_CR34","doi-asserted-by":"publisher","first-page":"1349","DOI":"10.1109\/34.895972","volume":"22","author":"AW Smeulders","year":"2000","unstructured":"Smeulders, A.W., Worring, M., Santini, S., Gupta, A., Jain, R.: Content-based image retrieval at the end of the early years. IEEE Trans. Pattern Anal. Mach. Intell. 22(12), 1349\u20131380 (2000)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"337_CR35","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Liu, W., Jia, Y., Sermanet, P., Reed, S., Anguelov, D., Erhan, D., Vanhoucke, V., Rabinovich, A.: Going deeper with convolutions. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. pp. 1\u20139 (2015)","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"337_CR36","unstructured":"Tan, M., Le, Q.: EfficientNet: Rethinking model scaling for convolutional neural networks. In: Proceedings of the International Conference on Machine Learning. pp. 6105\u20136114 (2019)"},{"key":"337_CR37","doi-asserted-by":"crossref","unstructured":"Wang, H., Wang, Y., Zhou, Z., Ji, X., Gong, D., Zhou, J., Li, Z., Liu, W.: CosFace: Large margin cosine loss for deep face recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp 5265\u20135274. IEEE Computer Society (2018)","DOI":"10.1109\/CVPR.2018.00552"},{"key":"337_CR38","doi-asserted-by":"crossref","unstructured":"Wang, J., Yi, X., Guo, R., Jin, H., Xu, P., Li, S., Wang, X., Guo, X., Li, C., Xu, X., et\u00a0al.: Milvus: A purpose-built vector data management system. In: Proceedings of the International Conference on Management of Data, pp 2614\u20132627 (2021)","DOI":"10.1145\/3448016.3457550"},{"issue":"4","key":"337_CR39","doi-asserted-by":"publisher","first-page":"769","DOI":"10.1109\/TPAMI.2017.2699960","volume":"40","author":"J Wang","year":"2017","unstructured":"Wang, J., Zhang, T., Sebe, N., Shen, H.T., et al.: A survey on learning to hash. IEEE Trans. Pattern Anal. Mach. Intell. 40(4), 769\u2013790 (2017)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"1","key":"337_CR40","doi-asserted-by":"publisher","first-page":"34","DOI":"10.1109\/JPROC.2015.2487976","volume":"104","author":"J Wang","year":"2015","unstructured":"Wang, J., Liu, W., Kumar, S., Chang, S.F.: Learning to hash for indexing big data: a survey. Proc. IEEE 104(1), 34\u201357 (2015)","journal-title":"Proc. IEEE"},{"key":"337_CR41","unstructured":"Yeager, L., Bernauer, J., Gray, A., Houston, M.: Digits: the deep learning GPU training system. In: ICML 2015 AutoML Workshop (2015)"},{"issue":"6","key":"337_CR42","doi-asserted-by":"publisher","first-page":"1452","DOI":"10.1109\/TPAMI.2017.2723009","volume":"40","author":"B Zhou","year":"2017","unstructured":"Zhou, B., Lapedriza, A., Khosla, A., Oliva, A., Torralba, A.: Places: a 10 million image database for scene recognition. IEEE Trans. Pattern Anal. Mach. Intell. 40(6), 1452\u20131464 (2017)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."}],"container-title":["International Journal on Digital Libraries"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00799-022-00337-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00799-022-00337-y\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00799-022-00337-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,11,10]],"date-time":"2022-11-10T20:09:39Z","timestamp":1668110979000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00799-022-00337-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,9,10]]},"references-count":42,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2022,12]]}},"alternative-id":["337"],"URL":"https:\/\/doi.org\/10.1007\/s00799-022-00337-y","relation":{},"ISSN":["1432-5012","1432-1300"],"issn-type":[{"value":"1432-5012","type":"print"},{"value":"1432-1300","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,9,10]]},"assertion":[{"value":"15 March 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 June 2022","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"5 July 2022","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"10 September 2022","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}