{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,19]],"date-time":"2025-09-19T09:05:24Z","timestamp":1758272724805,"version":"3.40.4"},"publisher-location":"Cham","reference-count":29,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031758225"},{"type":"electronic","value":"9783031758232"}],"license":[{"start":{"date-parts":[[2024,10,25]],"date-time":"2024-10-25T00:00:00Z","timestamp":1729814400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,10,25]],"date-time":"2024-10-25T00:00:00Z","timestamp":1729814400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-75823-2_12","type":"book-chapter","created":{"date-parts":[[2024,10,24]],"date-time":"2024-10-24T20:33:24Z","timestamp":1729802004000},"page":"140-154","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Information Dissimilarity Measures in\u00a0Decentralized Knowledge Distillation: A Comparative Analysis"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-2096-1701","authenticated-orcid":false,"given":"Mbasa Joaquim","family":"Molo","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7182-7038","authenticated-orcid":false,"given":"Lucia","family":"Vadicamo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3643-5404","authenticated-orcid":false,"given":"Emanuele","family":"Carlini","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3715-149X","authenticated-orcid":false,"given":"Claudio","family":"Gennaro","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4734-8103","authenticated-orcid":false,"given":"Richard","family":"Connor","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,10,25]]},"reference":[{"unstructured":"Agarwala, A., Pennington, J., Dauphin, Y., Schoenholz, S.: Temperature check: theory and practice for training models with softmax-cross-entropy losses. arXiv preprint arXiv:2010.07344 (2020)","key":"12_CR1"},{"doi-asserted-by":"crossref","unstructured":"Aguilar, G., Ling, Y., Zhang, Y., Yao, B., Fan, X., Guo, C.: Knowledge distillation from internal representations. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol.\u00a034, pp. 7350\u20137357 (2020)","key":"12_CR2","DOI":"10.1609\/aaai.v34i05.6229"},{"key":"12_CR3","first-page":"22593","volume":"33","author":"I Bistritz","year":"2020","unstructured":"Bistritz, I., Mann, A., Bambos, N.: Distributed distillation for on-device learning. Adv. Neural. Inf. Process. Syst. 33, 22593\u201322604 (2020)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"doi-asserted-by":"crossref","unstructured":"Carta, A., Cossu, A., Lomonaco, V., Bacciu, D., van\u00a0de Weijer, J.: Projected latent distillation for data-agnostic consolidation in distributed continual learning. Neurocomputing 127935 (2024)","key":"12_CR4","DOI":"10.1016\/j.neucom.2024.127935"},{"doi-asserted-by":"crossref","unstructured":"Connor, R.: A tale of four metrics. In: 9th International Conference on Similarity Search and Applications, SISAP 2016, pp. 210\u2013217. Springer (2016)","key":"12_CR5","DOI":"10.1007\/978-3-319-46759-7_16"},{"doi-asserted-by":"crossref","unstructured":"Connor, R., Dearle, A., Claydon, B., Vadicamo, L.: Correlations of cross-entropy loss in machine learning. Entropy 26(6) (2024)","key":"12_CR6","DOI":"10.3390\/e26060491"},{"issue":"7","key":"12_CR7","doi-asserted-by":"publisher","first-page":"1857","DOI":"10.1007\/s11263-023-01792-z","volume":"131","author":"J Gou","year":"2023","unstructured":"Gou, J., Xiong, X., Yu, B., Du, L., Zhan, Y., Tao, D.: Multi-target knowledge distillation via student self-reflection. Int. J. Comput. Vis. 131(7), 1857\u20131874 (2023)","journal-title":"Int. J. Comput. Vis."},{"issue":"6","key":"12_CR8","doi-asserted-by":"publisher","first-page":"1789","DOI":"10.1007\/s11263-021-01453-z","volume":"129","author":"J Gou","year":"2021","unstructured":"Gou, J., Yu, B., Maybank, S.J., Tao, D.: Knowledge distillation: a survey. Int. J. Comput. Vis. 129(6), 1789\u20131819 (2021)","journal-title":"Int. J. Comput. Vis."},{"doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","key":"12_CR9","DOI":"10.1109\/CVPR.2016.90"},{"unstructured":"Hinton, G., Vinyals, O., Dean, J.: Distilling the knowledge in a neural network (2015)","key":"12_CR10"},{"doi-asserted-by":"crossref","unstructured":"Jeong, E., Kountouris, M.: Personalized decentralized federated learning with knowledge distillation. In: ICC 2023-IEEE International Conference on Communications, pp. 1982\u20131987. IEEE (2023)","key":"12_CR11","DOI":"10.1109\/ICC45041.2023.10279714"},{"issue":"2","key":"12_CR12","doi-asserted-by":"publisher","first-page":"567","DOI":"10.1109\/TPDS.2022.3225185","volume":"34","author":"H Jin","year":"2023","unstructured":"Jin, H., Bai, D., Yao, D., Dai, Y., Gu, L., Yu, C., Sun, L.: Personalized edge intelligence via federated self-knowledge distillation. IEEE Trans. Parallel Distrib. Syst. 34(2), 567\u2013580 (2023)","journal-title":"IEEE Trans. Parallel Distrib. Syst."},{"doi-asserted-by":"crossref","unstructured":"Kim, T., Oh, J., Kim, N., Cho, S., Yun, S.Y.: Comparing kullback-leibler divergence and mean squared error loss in knowledge distillation. arXiv preprint arXiv:2105.08919 (2021)","key":"12_CR13","DOI":"10.24963\/ijcai.2021\/362"},{"unstructured":"Krizhevsky, A., Nair, V., Hinton, G.: Cifar-10 (Canadian institute for advanced research) (2009)","key":"12_CR14"},{"key":"12_CR15","doi-asserted-by":"publisher","first-page":"1001","DOI":"10.1109\/OJCOMS.2023.3265425","volume":"4","author":"X Liu","year":"2023","unstructured":"Liu, X., Yu, J., Liu, Y., Gao, Y., Mahmoodi, T., Lambotharan, S., Tsang, D.H.K.: Distributed intelligence in wireless networks. IEEE Open J. Commun. Soc. 4, 1001\u20131039 (2023)","journal-title":"IEEE Open J. Commun. Soc."},{"key":"12_CR16","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2023.110480","volume":"268","author":"Y Luo","year":"2023","unstructured":"Luo, Y., Huang, Q., Ling, J., Lin, K., Zhou, T.: Local and global knowledge distillation with direction-enhanced contrastive learning for single-image deraining. Knowl. Based Syst. 268, 110480 (2023)","journal-title":"Knowl. Based Syst."},{"doi-asserted-by":"crossref","unstructured":"Markatou, M., Chen, Y., Afendras, G., Lindsay, B.G.: Statistical distances and their role in robustness. In: New Advances in Statistics and Data Science, pp. 3\u201326 (2017)","key":"12_CR17","DOI":"10.1007\/978-3-319-69416-0_1"},{"doi-asserted-by":"crossref","unstructured":"Mishra, R., Gupta, H.P.: Designing and training of lightweight neural networks on edge devices using early halting in knowledge distillation. IEEE Trans. Mobile Comput. (2023)","key":"12_CR18","DOI":"10.1109\/TMC.2023.3297026"},{"key":"12_CR19","first-page":"515","volume":"508","author":"MJ Molo","year":"2024","unstructured":"Molo, M.J., Carlini, E., Ciampi, L., Gennaro, C., Vadicamo, L.: Teacher-student models for AI vision at the edge: a car parking case study. Proceedings Copyright 508, 515 (2024)","journal-title":"Proceedings Copyright"},{"doi-asserted-by":"crossref","unstructured":"Moss, R., Connor, R.: A multi-way divergence metric for vector spaces. In: Similarity Search and Applications: 6th International Conference, SISAP 2013, A Coru\u00f1a, Spain, October 2\u20134, 2013, Proceedings 6, pp. 169\u2013174. Springer (2013)","key":"12_CR20","DOI":"10.1007\/978-3-642-41062-8_17"},{"issue":"2","key":"12_CR21","doi-asserted-by":"publisher","first-page":"221","DOI":"10.3390\/e22020221","volume":"22","author":"F Nielsen","year":"2020","unstructured":"Nielsen, F.: On a generalization of the Jensen-Shannon divergence and the Jensen-Shannon centroid. Entropy 22(2), 221 (2020)","journal-title":"Entropy"},{"doi-asserted-by":"crossref","unstructured":"Parker, L.E.: Distributed intelligence: overview of the field and its application in multi-robot systems. In: AAAI Fall Symposium: Regarding the Intelligence in Distributed Intelligent Systems, pp.\u00a01\u20136 (2007)","key":"12_CR22","DOI":"10.14198\/JoPha.2008.2.1.02"},{"key":"12_CR23","doi-asserted-by":"publisher","first-page":"16441","DOI":"10.1109\/ACCESS.2017.2739804","volume":"5","author":"Y Sahni","year":"2017","unstructured":"Sahni, Y., Cao, J., Zhang, S., Yang, L.: Edge mesh: a new paradigm to enable distributed intelligence in internet of things. IEEE Access 5, 16441\u201316458 (2017)","journal-title":"IEEE Access"},{"issue":"4","key":"12_CR24","doi-asserted-by":"publisher","first-page":"1602","DOI":"10.1109\/18.850703","volume":"46","author":"F Topsoe","year":"2000","unstructured":"Topsoe, F.: Some inequalities for information divergence and related measures of discrimination. IEEE Trans. Inf. Theory 46(4), 1602\u20131609 (2000)","journal-title":"IEEE Trans. Inf. Theory"},{"doi-asserted-by":"crossref","unstructured":"Tung, F., Mori, G.: Similarity-preserving knowledge distillation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 1365\u20131374 (2019)","key":"12_CR25","DOI":"10.1109\/ICCV.2019.00145"},{"key":"12_CR26","doi-asserted-by":"publisher","first-page":"599","DOI":"10.1109\/TPAMI.1985.4767707","volume":"5","author":"AK Wong","year":"1985","unstructured":"Wong, A.K., You, M.: Entropy and distance of random graphs with application to structural pattern recognition. IEEE Trans. Pattern Anal. Mach. Intell. 5, 599\u2013609 (1985)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"doi-asserted-by":"crossref","unstructured":"Yang, Z., Zeng, A., Li, Z., Zhang, T., Yuan, C., Li, Y.: From knowledge distillation to self-knowledge distillation: a unified approach with normalized loss and customized soft labels. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 17185\u201317194 (2023)","key":"12_CR27","DOI":"10.1109\/ICCV51070.2023.01576"},{"doi-asserted-by":"crossref","unstructured":"Zhmoginov, A., Sandler, M., Miller, N., Kristiansen, G., Vladymyrov, M.: Decentralized learning with multi-headed distillation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 8053\u20138063 (2023)","key":"12_CR28","DOI":"10.1109\/CVPR52729.2023.00778"},{"unstructured":"Zhou, B., Lapedriza, A., Xiao, J., Torralba, A., Oliva, A.: Learning deep features for scene recognition using places database. Adv. Neural Inf. Process. Syst. 27 (2014)","key":"12_CR29"}],"container-title":["Lecture Notes in Computer Science","Similarity Search and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-75823-2_12","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,23]],"date-time":"2025-04-23T17:05:43Z","timestamp":1745427943000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-75823-2_12"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10,25]]},"ISBN":["9783031758225","9783031758232"],"references-count":29,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-75823-2_12","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2024,10,25]]},"assertion":[{"value":"25 October 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"SISAP","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Similarity Search and Applications","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Providence, RI","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"USA","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"5 November 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"7 November 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"sisap2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/www.sisap.org\/2024\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}