{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,29]],"date-time":"2026-04-29T06:45:49Z","timestamp":1777445149498,"version":"3.51.4"},"reference-count":212,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,7,26]],"date-time":"2025-07-26T00:00:00Z","timestamp":1753488000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2025,7,26]],"date-time":"2025-07-26T00:00:00Z","timestamp":1753488000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Big Data"],"DOI":"10.1186\/s40537-025-01227-1","type":"journal-article","created":{"date-parts":[[2025,7,26]],"date-time":"2025-07-26T07:58:41Z","timestamp":1753516721000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["A guide to similarity measures and their data science applications"],"prefix":"10.1186","volume":"12","author":[{"given":"Avivit","family":"Levy","sequence":"first","affiliation":[]},{"given":"B. Riva","family":"Shalom","sequence":"additional","affiliation":[]},{"given":"Michal","family":"Chalamish","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,7,26]]},"reference":[{"issue":"3","key":"1227_CR1","first-page":"264","volume":"8","author":"L AbdAllah","year":"2013","unstructured":"AbdAllah L, Shimshoni I. An ensemble-clustering-based distance metric and its applications. Int J Bus Intell Data Min. 2013;8(3):264\u201387.","journal-title":"Int J Bus Intell Data Min"},{"key":"1227_CR2","doi-asserted-by":"publisher","first-page":"128","DOI":"10.1016\/j.procs.2021.05.076","volume":"189","author":"S Agarwala","year":"2021","unstructured":"Agarwala S, Anagawadi A, Guddeti R. Detecting semantic similarity of documents using natural language processing. Proc Comput Sci. 2021;189:128\u201335.","journal-title":"Proc Comput Sci"},{"key":"1227_CR3","doi-asserted-by":"crossref","unstructured":"Akash PS, Kadir ME, Ali AA, Shoyaib M. Inter-node hellinger distance based decision tree. In Proc. of the 28th International Joint Conference on Artificial Intelligence. 2019; 1967\u20131973.","DOI":"10.24963\/ijcai.2019\/272"},{"issue":"5","key":"1227_CR4","doi-asserted-by":"publisher","first-page":"305","DOI":"10.1016\/0020-0190(86)90091-8","volume":"23","author":"L Allison","year":"1986","unstructured":"Allison L, Dix TI. A bit-string longest-common-subsequence algorithm. Inf Process Lett. 1986;23(5):305\u201310.","journal-title":"Inf Process Lett"},{"issue":"7","key":"1227_CR5","first-page":"6185","volume":"35","author":"L Amgoud","year":"2021","unstructured":"Amgoud L, David V. A general setting for gradual semantics dealing with similarity. Proc AAAI Conf Artif Intell. 2021;35(7):6185\u201392.","journal-title":"Proc AAAI Conf Artif Intell"},{"issue":"6","key":"1227_CR6","doi-asserted-by":"publisher","first-page":"359","DOI":"10.1016\/j.jcss.2009.03.001","volume":"75","author":"A Amir","year":"2009","unstructured":"Amir A, Aumann Y, Benson G, Levy A, Lipsky O, Porat E, Skiena S, Vishne U. Pattern matching with address errors: rearrangement distances. J Comput Syst Sci. 2009;75(6):359\u201370.","journal-title":"J Comput Syst Sci"},{"issue":"43","key":"1227_CR7","doi-asserted-by":"publisher","first-page":"4382","DOI":"10.1016\/j.tcs.2009.07.019","volume":"410","author":"A Amir","year":"2009","unstructured":"Amir A, Aumann Y, Indyk P, Levy A, Porat E. Efficient computations of $$\\ell _1$$ and $$\\ell _{\\infty }$$ rearrangement distances. Theor Comput Sci. 2009;410(43):4382\u201390.","journal-title":"Theor Comput Sci"},{"issue":"3","key":"1227_CR8","doi-asserted-by":"publisher","first-page":"273","DOI":"10.1016\/j.jda.2010.02.001","volume":"8","author":"A Amir","year":"2010","unstructured":"Amir A, Gotthilf Z, Shalom BR. Weighted LCS. J Discret Algorithm. 2010;8(3):273\u201381.","journal-title":"J Discret Algorithm"},{"issue":"4","key":"1227_CR9","doi-asserted-by":"publisher","first-page":"1444","DOI":"10.1137\/080712969","volume":"39","author":"A Amir","year":"2009","unstructured":"Amir A, Hartman T, Kapah O, Levy A, Porat E. On the cost of interchange rearrangement in strings. SIAM J Comput (SICOMP). 2009;39(4):1444\u201361.","journal-title":"SIAM J Comput (SICOMP)"},{"issue":"3","key":"1227_CR10","doi-asserted-by":"publisher","first-page":"438","DOI":"10.1016\/j.tcs.2008.08.037","volume":"409","author":"A Amir","year":"2008","unstructured":"Amir A, Hartman T, Oren Kapah B, Shalom R, Tsur D. Generalized lcs. Theor Comput Sci. 2008;409(3):438\u201349.","journal-title":"Theor Comput Sci"},{"key":"1227_CR11","first-page":"1","volume-title":"Algorithms and applications","author":"A Amir","year":"2010","unstructured":"Amir A, Levy A. String rearrangement metrics: a survey. In: Elomaa T, Mannila H, Orponen P, editors. Algorithms and applications. Berlin: Springer; 2010. p. 1\u201333."},{"issue":"2","key":"1227_CR12","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1016\/S0196-6774(03)00097-X","volume":"50","author":"A Amir","year":"2004","unstructured":"Amir A, Lewenstein M, Porat E. Faster algorithms for string matching with k mismatches. J Algorithm. 2004;50(2):257\u201375.","journal-title":"J Algorithm"},{"key":"1227_CR13","doi-asserted-by":"crossref","unstructured":"Apostolico A, Landau GM, Skiena S. Matching for run-length encoded strings. In: Proc. Compression and Complexity of SEQUENCES. 1997; 348\u2013356.","DOI":"10.1109\/SEQUEN.1997.666929"},{"issue":"1","key":"1227_CR14","doi-asserted-by":"publisher","first-page":"100","DOI":"10.17694\/bajece.1212563","volume":"11","author":"I Atas","year":"2023","unstructured":"Atas I. Performance evaluation of Jaccard-dice coefficient on building segmentation from high resolution satellite images. Balkan J Electr Comput Eng. 2023;11(1):100\u20136.","journal-title":"Balkan J Electr Comput Eng"},{"issue":"04","key":"1227_CR15","first-page":"3219","volume":"34","author":"Y Bai","year":"2020","unstructured":"Bai Y, Ding H, Ken G, Sun Y, Wang W. Learning-based efficient graph similarity computation via multi-scale convolutional set matching. Proc AAAI Conf Artif Intell. 2020;34(04):3219\u201326.","journal-title":"Proc AAAI Conf Artif Intell"},{"key":"1227_CR16","unstructured":"Bara J, Lev O, Turrini P. Predicting voting outcomes in presence of communities. In Proc. of the 20th International Conference on Autonomous Agents and MultiAgent Systems. 2021; 151\u2013159."},{"key":"1227_CR17","unstructured":"Barr\u00f3n-Cede\u00f1o A, Rosso P, Agirre E, Labaka G. Plagiarism detection across distant language pairs. In the 23rd International Conference on Computational Linguistics. 2010; 37\u201345."},{"issue":"12","key":"1227_CR18","doi-asserted-by":"publisher","first-page":"882","DOI":"10.1007\/s11018-023-02180-2","volume":"65","author":"AN Bazhenov","year":"2023","unstructured":"Bazhenov AN, Telnova AY. Generalization of Jaccard index for interval data analysis. Meas Tech. 2023;65(12):882\u201390.","journal-title":"Meas Tech"},{"key":"1227_CR19","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1016\/j.tcs.2015.11.026","volume":"638","author":"G Benson","year":"2016","unstructured":"Benson G, Levy A, Maimoni S, Noifeld D, Riva Shalom B. LCSk: a refined similarity measure. Theor Comput Sci. 2016;638:11\u201326.","journal-title":"Theor Comput Sci"},{"key":"1227_CR20","doi-asserted-by":"crossref","unstructured":"Bergroth L, Hakonen H, Raita T. A survey of longest common subsequence algorithms. In Proc. 7th Symposium on String Processing and Information Retrieval. 2000; 39\u201348.","DOI":"10.1109\/SPIRE.2000.878178"},{"key":"1227_CR21","doi-asserted-by":"publisher","first-page":"87","DOI":"10.1016\/j.autcon.2017.12.036","volume":"88","author":"M Bermudez-Edo","year":"2018","unstructured":"Bermudez-Edo M, Barnaghi P, Moessner K. Analysing real world data streams with spatio-temporal correlations: Entropy vs. Pearson correlation. Autom Constr. 2018;88:87\u2013100.","journal-title":"Autom Constr"},{"key":"1227_CR22","doi-asserted-by":"crossref","unstructured":"Bertels J, Eelbode T, Berman M, Vandermeulen D, Maes F, Bisschops R, Blaschko MB. Optimizing the dice score and jaccard index for medical image segmentation: Theory and practice. In Medical Image Computing and Computer Assisted Intervention\u2013MICCAI 2019: 22nd International Conference, Shenzhen, China, October 13\u201317, 2019, Proceedings, Part II 22. 2019; 92\u2013100.","DOI":"10.1007\/978-3-030-32245-8_11"},{"key":"1227_CR23","first-page":"99","volume":"35","author":"AK Bhattacharyya","year":"1943","unstructured":"Bhattacharyya AK. On a measure of divergence between two statistical populations defined by their probability distributions. Bull Calcutta Math Soc. 1943;35:99\u2013109.","journal-title":"Bull Calcutta Math Soc"},{"key":"1227_CR24","doi-asserted-by":"crossref","unstructured":"Boneh I, Golan S, Levy A, Porat E, Shalom BR. Burst edit distance. In Zsuzsanna Lipt\u00e1k, Edleno\u00a0Silva de\u00a0Moura, Karina Figueroa, and Ricardo Baeza-Yates, editors, String Processing and Information Retrieval - 31st International Symposium, SPIRE 2024, Puerto Vallarta, Mexico, September 23-25, 2024, Proceedings, volume 14899 of Lecture Notes in Computer Science. Springer; 2024. 41\u201356.","DOI":"10.1007\/978-3-031-72200-4_4"},{"key":"1227_CR25","doi-asserted-by":"publisher","first-page":"123","DOI":"10.1023\/A:1018054314350","volume":"24","author":"L Breiman","year":"1996","unstructured":"Breiman L. Bagging predictors. Mach Learn. 1996;24:123\u201340.","journal-title":"Mach Learn"},{"key":"1227_CR26","doi-asserted-by":"crossref","unstructured":"Brown PO, Chiang MC, Guo S, Jin Y, Leung CK, Murray EL, Pazdor AGM, Cuzzocrea A. Mahalanobis distance based k-means clustering. In International Conference on Big Data Analytics and Knowledge Discovery. Springer; 2022. 256\u2013262.","DOI":"10.1007\/978-3-031-12670-3_23"},{"key":"1227_CR27","volume-title":"Big data: principles and paradigms","author":"R Buyya","year":"2016","unstructured":"Buyya R, Calheiros RN, Dastjerdi AV. Big data: principles and paradigms. Burlington: Morgan Kaufmann; 2016."},{"key":"1227_CR28","first-page":"527","volume":"34","author":"A Cayley","year":"1849","unstructured":"Cayley A. Note on the theory of permutations. Phil Mag. 1849;34:527\u20139.","journal-title":"Phil Mag"},{"key":"1227_CR29","first-page":"300","volume":"1","author":"S-H Cha","year":"2007","unstructured":"Cha S-H. Comprehensive survey on distance\/similarity measures between probability density functions. Int J Math Models Methods Appl Sci. 2007;1:300\u20137.","journal-title":"Int J Math Models Methods Appl Sci"},{"issue":"6","key":"1227_CR30","doi-asserted-by":"publisher","first-page":"1355","DOI":"10.1016\/S0031-3203(01)00118-2","volume":"35","author":"S-H Cha","year":"2002","unstructured":"Cha S-H, Srihari SN. On measuring the distance between histograms. Pattern Recogn. 2002;35(6):1355\u201370.","journal-title":"Pattern Recogn"},{"key":"1227_CR31","doi-asserted-by":"crossref","unstructured":"Chen T, Guestrin C. Xgboost: A scalable tree boosting system. In Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, KDD \u201916, New York, NY, USA, Association for Computing Machinery; 2016. 785\u2013794.","DOI":"10.1145\/2939672.2939785"},{"key":"1227_CR32","doi-asserted-by":"crossref","unstructured":"Chikodili NB, Abdulmalik MD, Abisoye OA, Bashir SA. Outlier detection in multivariate time series data using a fusion of k-medoid, standardized euclidean distance and z-score. In International Conference on Information and Communication Technology and Applications. Springer; 2020. 259\u2013271.","DOI":"10.1007\/978-3-030-69143-1_21"},{"key":"1227_CR33","doi-asserted-by":"crossref","unstructured":"Chopra S, Hadsell R, LeCun Y. Learning a similarity metric discriminatively, with application to face verification. In 2005 IEEE Computer Society Conference on Computer Vision and Pattern Recognition (CVPR\u201905). 2005; 1: 539\u2013546.","DOI":"10.1109\/CVPR.2005.202"},{"key":"1227_CR34","doi-asserted-by":"publisher","first-page":"136","DOI":"10.1007\/s10618-011-0222-1","volume":"24","author":"DA Cieslak","year":"2012","unstructured":"Cieslak DA, Hoens TR, Chawla NV, Kegelmeyer WP. Hellinger distance decision trees are robust and skew-insensitive. Data Min Knowl Discov. 2012;24:136\u201358.","journal-title":"Data Min Knowl Discov"},{"issue":"4","key":"1227_CR35","first-page":"445","volume":"35","author":"PJ Clark","year":"1954","unstructured":"Clark PJ, Evans FC. Distance to nearest neighbor as a measure of spatial relationships in populations. Ecol Ecol Soc Am. 1954;35(4):445\u201353.","journal-title":"Ecol Ecol Soc Am"},{"key":"1227_CR36","doi-asserted-by":"crossref","unstructured":"Clifford R, Fontaine A, Porat E, Sach B, Starikovskaya T. The k-mismatch problem revisited. In Proc. of the 27th Annual ACM-SIAM Symposium on Discrete Algorithms. 2016; 2039\u20132052.","DOI":"10.1137\/1.9781611974331.ch142"},{"key":"1227_CR37","unstructured":"Clifford R, Gawrychowski P, Kociumaka T, Martin DP, Uzna\u0144ski P. The dynamic k-mismatch problem. In 33rd Annual Symposium on Combinatorial Pattern Matching. 2022;223:18:1-18:15."},{"key":"1227_CR38","doi-asserted-by":"publisher","first-page":"448","DOI":"10.1016\/j.procs.2018.10.144","volume":"141","author":"A Clim","year":"2018","unstructured":"Clim A, Zota RD, TinicA G. The Kullback-Leibler divergence used in machine learning algorithms for health care applications and hypertension prediction: a literature review. Proc Comput Sci. 2018;141:448\u201353.","journal-title":"Proc Comput Sci"},{"key":"1227_CR39","first-page":"10554","volume":"36","author":"P Colombo","year":"2022","unstructured":"Colombo P, Clavel C, Piantanida P. Infolm: a new metric to evaluate summarization and data2text generation. Proc AAAI Conf Artif Intell. 2022;36:10554\u201362.","journal-title":"Proc AAAI Conf Artif Intell"},{"key":"1227_CR40","doi-asserted-by":"crossref","unstructured":"Connor R, Simeoni F, Iakovos M. Structural entropic difference: A bounded distance metric for unordered trees. In Second International Workshop on Similarity Search and Applications. 2009;21\u201329.","DOI":"10.1109\/SISAP.2009.29"},{"key":"1227_CR41","doi-asserted-by":"publisher","first-page":"122","DOI":"10.1016\/j.ins.2012.11.012","volume":"229","author":"I Couso","year":"2013","unstructured":"Couso I, Garrido L, S\u00e1nchez L. Similarity and dissimilarity measures between fuzzy sets: a formal relational study. Inf Sci. 2013;229:122\u201341.","journal-title":"Inf Sci"},{"key":"1227_CR42","doi-asserted-by":"publisher","first-page":"315","DOI":"10.1007\/978-3-540-33037-0_14","volume-title":"Multidimensional scaling, handbook of data visualization","author":"MAA Cox","year":"2008","unstructured":"Cox MAA, Cox TF. Multidimensional scaling, handbook of data visualization. Berlin: Springer; 2008. p. 315\u201347."},{"key":"1227_CR43","first-page":"2292","volume":"26","author":"M Cuturi","year":"2013","unstructured":"Cuturi M. Sinkhorn distances: lightspeed computation of optimal transport. Adv Neural Inf Process Syst. 2013;26:2292\u2013300.","journal-title":"Adv Neural Inf Process Syst"},{"issue":"3","key":"1227_CR44","doi-asserted-by":"publisher","first-page":"171","DOI":"10.1145\/363958.363994","volume":"7","author":"FJ Damerau","year":"1964","unstructured":"Damerau FJ. A technique for computer detection and correction of spelling errors. Commun ACM. 1964;7(3):171\u20136.","journal-title":"Commun ACM"},{"key":"1227_CR45","doi-asserted-by":"crossref","unstructured":"Dar G, Geva M, Gupta A, Berant J. Analyzing transformers in embedding space. In Anna Rogers, Jordan\u00a0L. Boyd-Graber, and Naoaki Okazaki, editors, Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), ACL 2023, Toronto, Canada. Association for Computational Linguistics July 9-14, 2023; 16124\u201316170.","DOI":"10.18653\/v1\/2023.acl-long.893"},{"key":"1227_CR46","doi-asserted-by":"crossref","unstructured":"Das D, Gilbert J, Hajiaghayi M, Kociumaka T, Saha B. Weighted edit distance computation: Strings, trees, and dyck. In Proceedings of the 55th Annual ACM Symposium on Theory of Computing. 2023; 377\u2013390.","DOI":"10.1145\/3564246.3585178"},{"key":"1227_CR47","doi-asserted-by":"crossref","unstructured":"Deng J, Guo J, Xue N, Zafeiriou S. Arcface: Additive angular margin loss for deep face recognition. In Proc. of the IEEE\/CVF conference on computer vision and pattern recognition. 2019;4690\u20134699.","DOI":"10.1109\/CVPR.2019.00482"},{"key":"1227_CR48","unstructured":"Dey P, Medya S. Manipulating node similarity measures in networks. In Proc. of the 19th International Conference on Autonomous Agents and Multiagent Systems. 2020;321\u2013329."},{"key":"1227_CR49","volume-title":"Dictionary of distances","author":"E Deza","year":"2006","unstructured":"Deza E, Deza M-M. Dictionary of distances. Amsterdam: Elsevier; 2006."},{"key":"1227_CR50","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-00234-2","volume-title":"Encyclopedia of distances","author":"MM Deza","year":"2009","unstructured":"Deza MM, Deza E. Encyclopedia of distances. Berlin: Springer; 2009."},{"issue":"3","key":"1227_CR51","doi-asserted-by":"publisher","first-page":"297","DOI":"10.2307\/1932409","volume":"26","author":"LR Dice","year":"1945","unstructured":"Dice LR. Measures of the amount of ecologic association between species. Ecology. 1945;26(3):297\u2013302.","journal-title":"Ecology"},{"key":"1227_CR52","volume-title":"Pattern classification","author":"RO Duda","year":"2001","unstructured":"Duda RO, Hart PE, Stork DG. Pattern classification. Hoboken: Wiley; 2001."},{"issue":"11","key":"1227_CR53","doi-asserted-by":"publisher","first-page":"3679","DOI":"10.1109\/TMI.2020.3002417","volume":"39","author":"T Eelbode","year":"2020","unstructured":"Eelbode T, Bertels J, Berman M, Vandermeulen D, Maes F, Bisschops R, Blaschko MB. Optimization for medical image segmentation: theory and practice when evaluating with dice score or Jaccard index. IEEE Trans Med Imaging. 2020;39(11):3679\u201390.","journal-title":"IEEE Trans Med Imaging"},{"key":"1227_CR54","doi-asserted-by":"crossref","unstructured":"Ehara Y. Analyzing similarities between word frequency distributions of various corpora to find effective features for complex word identification. In 2019 International Conference on Data Mining Workshops (ICDMW). IEEE; 2019. 1\u20134.","DOI":"10.1109\/ICDMW48858.2019.9024753"},{"key":"1227_CR55","doi-asserted-by":"publisher","first-page":"19","DOI":"10.1002\/qre.441","volume":"18","author":"SM Emran","year":"2002","unstructured":"Emran SM, Ye N. Robustness of Chi-square and Canberra distance metrics for computer intrusion detection. Qual Reliab Eng Int. 2002;18:19.","journal-title":"Qual Reliab Eng Int"},{"key":"1227_CR56","doi-asserted-by":"publisher","first-page":"012112","DOI":"10.1088\/1742-6596\/1566\/1\/012112","volume":"1566","author":"M Faisal","year":"2020","unstructured":"Faisal M, Zamzami EM, et al. Comparative analysis of inter-centroid k-means performance using Euclidean distance, Canberra distance and Manhattan distance. J Phys Conf Ser. 2020;1566:012112.","journal-title":"J Phys Conf Ser"},{"key":"1227_CR57","unstructured":"Fisman D, Grogin J, Margalit O, Weiss G. The normalized edit distance with uniform operation costs is a metric. In 33rd Annual Symposium on Combinatorial Pattern Matching. 2022;223:17:1\u201317:17."},{"key":"1227_CR58","first-page":"1","volume":"22","author":"S Fletcher","year":"2018","unstructured":"Fletcher S, Islam MZ, et al. Comparing sets of patterns with the Jaccard index. Australas J Inf Syst. 2018;22:1.","journal-title":"Australas J Inf Syst"},{"key":"1227_CR59","unstructured":"Freund Y, Schapire RE. Experiments with a new boosting algorithm. In Proceedings of the Thirteenth International Conference on International Conference on Machine Learning, ICML\u201996. San Francisco, CA, USA, Morgan Kaufmann Publishers Inc; 1996. 148\u2013156."},{"issue":"1","key":"1227_CR60","doi-asserted-by":"publisher","first-page":"119","DOI":"10.1006\/jcss.1997.1504","volume":"55","author":"Y Freund","year":"1997","unstructured":"Freund Y, Schapire RE. A decision-theoretic generalization of on-line learning and an application to boosting. J Comput Syst Sci. 1997;55(1):119\u201339.","journal-title":"J Comput Syst Sci"},{"issue":"5","key":"1227_CR61","doi-asserted-by":"publisher","first-page":"1189","DOI":"10.1214\/aos\/1013203451","volume":"29","author":"JH Friedman","year":"2001","unstructured":"Friedman JH. Greedy function approximation: a gradient boosting machine. Ann Stat. 2001;29(5):1189\u2013232.","journal-title":"Ann Stat"},{"issue":"11","key":"1227_CR62","doi-asserted-by":"publisher","first-page":"7005","DOI":"10.1007\/s10115-024-02177-5","volume":"66","author":"VR Ganji","year":"2024","unstructured":"Ganji VR, Chaparala A. Wave hedges distance-based feature fusion and hybrid optimization-enabled deep learning for cyber credit card fraud detection. Knowl Inf Syst. 2024;66(11):7005\u201330.","journal-title":"Knowl Inf Syst"},{"key":"1227_CR63","doi-asserted-by":"crossref","unstructured":"Gao J, Gao J. A similarity measurement method based on graph kernel for disconnected graphs. In Proc. of the 28th International Joint Conference on Artificial Intelligence. 2019;6430\u20136431.","DOI":"10.24963\/ijcai.2019\/904"},{"issue":"5","key":"1227_CR64","doi-asserted-by":"publisher","first-page":"648","DOI":"10.1191\/0959683605hl841rp","volume":"15","author":"DG Gavin","year":"2005","unstructured":"Gavin DG, Brubaker LB, McLachlan JS, Oswald WW. Correspondence of pollen assemblages with forest zones across steep environmental gradients, Olympic Peninsula, Washington, USA. Holocene. 2005;15(5):648\u201362.","journal-title":"Holocene"},{"key":"1227_CR65","doi-asserted-by":"publisher","first-page":"356","DOI":"10.1016\/S0033-5894(03)00088-7","volume":"60","author":"DG Gavin","year":"2003","unstructured":"Gavin DG, Oswald WW, Wahl ER, Williams JW. A statistical approach to evaluating distance metrics and analog assignments for pollen records. Quat Res. 2003;60:356\u201367.","journal-title":"Quat Res"},{"key":"1227_CR66","first-page":"22","volume":"123","author":"O Gavrilenko","year":"2023","unstructured":"Gavrilenko O, Khomenko O, Zhurakovska O, Kohan A, Matviichuk R, Piskun A, Khavikova Y. Establishing the grouping principle of public services based on the analysis of similarity coefficients. East Eur J Enterp Technol. 2023;123:22\u20139.","journal-title":"East Eur J Enterp Technol"},{"key":"1227_CR67","unstructured":"Gawrychowski P, Uzna\u0144ski P. Towards unified approximate pattern matching for Hamming and $$L_1$$ distance. In 45th International Colloquium on Automata, Languages, and Programming. 2018;107: 62:1\u201362:13."},{"key":"1227_CR68","first-page":"583","volume":"34","author":"H Ghorbani","year":"2019","unstructured":"Ghorbani H. Mahalanobis distance and its application for detecting multivariate outliers. Facta Univ Ser Math Inform. 2019;34:583\u201395.","journal-title":"Facta Univ Ser Math Inform"},{"key":"1227_CR69","doi-asserted-by":"publisher","first-page":"444","DOI":"10.1093\/biomet\/48.3-4.444","volume":"48","author":"GJ Glasser","year":"1961","unstructured":"Glasser GJ, Winter RF. Critical values of the coefficient of rank correlation for testing the hypothesis of independance. Biometrika. 1961;48:444\u20138.","journal-title":"Biometrika"},{"key":"1227_CR70","doi-asserted-by":"publisher","first-page":"205","DOI":"10.1016\/j.inffus.2020.07.007","volume":"64","author":"S Gonz\u00e1lez","year":"2020","unstructured":"Gonz\u00e1lez S, Garc\u00eda S, Del Ser J, Rokach L, Herrera F. A practical tutorial on bagging and boosting based ensembles for machine learning: algorithms, software tools, performance study, practical perspectives and opportunities. Inf Fusion. 2020;64:205\u201337.","journal-title":"Inf Fusion"},{"key":"1227_CR71","doi-asserted-by":"publisher","first-page":"146","DOI":"10.1016\/j.ins.2012.05.028","volume":"218","author":"V Gonz\u00e1lez-Castro","year":"2013","unstructured":"Gonz\u00e1lez-Castro V, Alaiz-Rodr\u00edguez R, Alegre E. Class distribution estimation based on the hellinger distance. Inf Sci. 2013;218:146\u201364.","journal-title":"Inf Sci"},{"key":"1227_CR72","doi-asserted-by":"crossref","unstructured":"Gotthilf Z, Hermelin D, Landau GM, Lewenstein M. Restricted LCS. In Proc. of the 17th International Conference on String Processing and Information Retrieval. 2010;250\u2013257.","DOI":"10.1007\/978-3-642-16321-0_26"},{"issue":"4","key":"1227_CR73","doi-asserted-by":"publisher","first-page":"857","DOI":"10.2307\/2528823","volume":"27","author":"JC Gower","year":"1971","unstructured":"Gower JC. A general coefficient of similarity and some of its properties. Biometrics. 1971;27(4):857\u201371.","journal-title":"Biometrics"},{"key":"1227_CR74","volume-title":"A guide to chi-squared testing","author":"PE Greenwood","year":"1996","unstructured":"Greenwood PE, Nikulin MS. A guide to chi-squared testing. New York: Wiley; 1996."},{"issue":"5","key":"1227_CR75","doi-asserted-by":"publisher","first-page":"123","DOI":"10.21468\/SciPostPhys.16.5.123","volume":"16","author":"G Grosso","year":"2024","unstructured":"Grosso G, Letizia M, Pierini M, Wulzer A. Goodness of fit by Neyman-Pearson testing. SciPost Phys. 2024;16(5):123.","journal-title":"SciPost Phys"},{"issue":"1","key":"1227_CR76","doi-asserted-by":"publisher","first-page":"012092","DOI":"10.1088\/1757-899X\/420\/1\/012092","volume":"420","author":"S Gultom","year":"2018","unstructured":"Gultom S, Sriadhi S, Martiano M, Simarmata J. Comparison analysis of k-means and k-medoid with Ecluidience distance algorithm, Chanberra distance, and Chebyshev distance for big data clustering. IOP Conf Ser Mater Sci Eng. 2018;420(1):012092.","journal-title":"IOP Conf Ser Mater Sci Eng"},{"key":"1227_CR77","doi-asserted-by":"publisher","first-page":"507038","DOI":"10.3389\/fgene.2020.507038","volume":"11","author":"X Guo","year":"2020","unstructured":"Guo X. Js-ma: a jensen-shannon divergence based method for mapping genome-wide associations on multiple diseases. Front Genet. 2020;11:507038.","journal-title":"Front Genet"},{"key":"1227_CR78","doi-asserted-by":"crossref","unstructured":"Guo Y, Ding G, Han J, Zhao S, Wang B. Implicit non-linear similarity scoring for recognizing unseen classes. In Proc. of the 27th International Joint Conference on Artificial Intelligence. 2018;4898\u20134904.","DOI":"10.24963\/ijcai.2018\/680"},{"issue":"2","key":"1227_CR79","doi-asserted-by":"publisher","first-page":"147","DOI":"10.1002\/j.1538-7305.1950.tb00463.x","volume":"29","author":"RW Hamming","year":"1950","unstructured":"Hamming RW. Error detecting and error correcting codes. Bell Syst Tech J. 1950;29(2):147\u201360.","journal-title":"Bell Syst Tech J"},{"key":"1227_CR80","volume-title":"Introduction to social network methods","author":"RA Hanneman","year":"2005","unstructured":"Hanneman RA, Riddle M. Introduction to social network methods. Riverside: University of California; 2005."},{"key":"1227_CR81","unstructured":"Hassanat AB. Dimensionality invariant similarity measure. 2014."},{"key":"1227_CR82","doi-asserted-by":"publisher","first-page":"349","DOI":"10.4310\/SII.2009.v2.n3.a8","volume":"2","author":"T Hastie","year":"2009","unstructured":"Hastie T, Rosset S, Zhu J, Zou H. Multi-class adaboost. Stat interface. 2009;2:349\u201360.","journal-title":"Stat interface"},{"key":"1227_CR83","first-page":"439","volume":"5150","author":"M Hatzigiorgaki","year":"2003","unstructured":"Hatzigiorgaki M, Skodras AN. Compressed domain image retrieval: a comparative study of similarity metrics. Vis Commun Image Process. 2003;5150:439\u201348.","journal-title":"Vis Commun Image Process"},{"key":"1227_CR84","doi-asserted-by":"publisher","first-page":"108558","DOI":"10.1016\/j.comnet.2021.108558","volume":"203","author":"A Hbaieb","year":"2022","unstructured":"Hbaieb A, Ayed S, Chaari L. A survey of trust management in the internet of vehicles. Comput Netw. 2022;203:108558.","journal-title":"Comput Netw"},{"key":"1227_CR85","first-page":"575","volume":"61","author":"TS Hedges","year":"1976","unstructured":"Hedges TS. An empirical modication to linear wave theory. Inst Civ Eng. 1976;61:575\u20139.","journal-title":"Inst Civ Eng"},{"key":"1227_CR86","doi-asserted-by":"publisher","first-page":"210","DOI":"10.1515\/crll.1909.136.210","volume":"136","author":"E Hellinger","year":"1909","unstructured":"Hellinger E. Neue begr\u00fcndung der theorie quadratischer formen von unendlichvielen ver\u00e4nderlichen. J F\u00fcr Die Reine Angewandte Mathematik. 1909;136:210\u201371.","journal-title":"J F\u00fcr Die Reine Angewandte Mathematik"},{"key":"1227_CR87","doi-asserted-by":"publisher","DOI":"10.1101\/2024.09.30.615781","author":"L Hemm","year":"2024","unstructured":"Hemm L, Rabsch D, Ropp HR, Reimann V, Gerth P, Bartel J, Brenes-\u00c1lvarez M, Maass S, Becher D, Hess WR, et al. Rapdor: using Jensen-Shannon distance for the computational analysis of complex proteomics datasets. BioRxiv. 2024. https:\/\/doi.org\/10.1101\/2024.09.30.615781.","journal-title":"BioRxiv"},{"issue":"5","key":"1227_CR88","doi-asserted-by":"publisher","first-page":"739","DOI":"10.1002\/mds.26942","volume":"32","author":"EM Hill-Burns","year":"2017","unstructured":"Hill-Burns EM, Debelius JW, Morton JT, Wissemann WT, Lewis MR, Wallen ZD, Peddada SD, Factor SA, Molho E, Zabetian CP, Knight R, Payami H. Parkinson\u2019s disease and Parkinson\u2019s disease medications have distinct signatures of the gut microbiome. Mov Disord Off J Mov Disord Soc. 2017;32(5):739\u201349.","journal-title":"Mov Disord Off J Mov Disord Soc"},{"issue":"6","key":"1227_CR89","doi-asserted-by":"publisher","first-page":"341","DOI":"10.1145\/360825.360861","volume":"18","author":"DS Hirschberg","year":"1975","unstructured":"Hirschberg DS. A linear space algorithm for computing maximal common subsequences. Commun ACM. 1975;18(6):341\u20133.","journal-title":"Commun ACM"},{"key":"1227_CR90","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-14595-7","volume-title":"Normalization techniques in deep learning","author":"L Huang","year":"2022","unstructured":"Huang L. Normalization techniques in deep learning. Berlin: Springer; 2022."},{"key":"1227_CR91","doi-asserted-by":"publisher","first-page":"96","DOI":"10.1016\/j.compind.2015.12.001","volume":"78","author":"A Ittoo","year":"2016","unstructured":"Ittoo A, Nguyen LM, van den Bosch A. Text analytics in industry: challenges, desiderata and trends. Comput Ind. 2016;78:96\u2013107.","journal-title":"Comput Ind"},{"issue":"2","key":"1227_CR92","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1111\/j.1469-8137.1912.tb05611.x","volume":"11","author":"P Jaccard","year":"1912","unstructured":"Jaccard P. The distribution of the flora in the alpine zone. New Phytol. 1912;11(2):37\u201350.","journal-title":"New Phytol"},{"key":"1227_CR93","first-page":"52","volume":"644","author":"G Jacobson","year":"1992","unstructured":"Jacobson G, Vo K-P. Heaviest increasing\/common subsequence problems. Proc Comb Pattern Matching. 1992;644:52\u201366.","journal-title":"Proc Comb Pattern Matching"},{"issue":"406","key":"1227_CR94","doi-asserted-by":"publisher","first-page":"414","DOI":"10.1080\/01621459.1989.10478785","volume":"84","author":"MA Jaro","year":"1989","unstructured":"Jaro MA. Advances in record linkage methodology as applied to the 1985 census of Tampa Florida. J Am Stat Soc. 1989;84(406):414\u201320.","journal-title":"J Am Stat Soc"},{"key":"1227_CR95","doi-asserted-by":"publisher","first-page":"147","DOI":"10.1016\/j.geomorph.2012.11.005","volume":"182","author":"J Jasiewicz","year":"2013","unstructured":"Jasiewicz J, Stepinski TF. Geomorphons - a pattern recognition approach to classification and mapping of landforms. Geomorphology. 2013;182:147\u201356.","journal-title":"Geomorphology"},{"key":"1227_CR96","volume-title":"Theory of probability","author":"H Jeffreys","year":"1948","unstructured":"Jeffreys H. Theory of probability. 2nd ed. Oxford: Clarendon Press; 1948.","edition":"2"},{"key":"1227_CR97","unstructured":"Jurman G, Riccadonna S, Visintainer R, Furlanello C. Canberra distance on ranked lists. 2009."},{"key":"1227_CR98","unstructured":"Kamoi R, Kobayashi K. Why is the mahalanobis distance effective for anomaly detection? arXiv preprint arXiv:2003.00402, 2020."},{"issue":"43","key":"1227_CR99","doi-asserted-by":"publisher","first-page":"4315","DOI":"10.1016\/j.tcs.2009.07.013","volume":"410","author":"O Kapah","year":"2009","unstructured":"Kapah O, Landau GM, Levy A, Oz N. Interchange rearrangement: the element-cost model. Theoret Comput Sci. 2009;410(43):4315\u201326.","journal-title":"Theoret Comput Sci"},{"key":"1227_CR100","doi-asserted-by":"publisher","first-page":"392","DOI":"10.1016\/j.chnaes.2016.07.001","volume":"36","author":"B Kebede","year":"2016","unstructured":"Kebede B, Soromessa T, Kelbessa E. Floristic composition and community types of gedo dry evergreen montane forest, west Shewa, Ethiopia. Acta Ecol Sinica. 2016;36:392\u2013400.","journal-title":"Acta Ecol Sinica"},{"key":"1227_CR101","doi-asserted-by":"publisher","first-page":"170","DOI":"10.1016\/j.patrec.2016.09.006","volume":"184","author":"Y Kerimbekov","year":"2016","unstructured":"Kerimbekov Y, Bilge HS, U\u011furlu HH. The use of Lorentzian distance metric in classification problems. Pattern Recognit Lett. 2016;184:170\u20136.","journal-title":"Pattern Recognit Lett"},{"key":"1227_CR102","doi-asserted-by":"crossref","unstructured":"Kim T, Oh J, Kim N, Cho S, Yun S-Y. Comparing kullback-leibler divergence and mean squared error loss in knowledge distillation. arXiv preprint arXiv:2105.08919, 2021.","DOI":"10.24963\/ijcai.2021\/362"},{"issue":"2","key":"1227_CR103","doi-asserted-by":"publisher","first-page":"226","DOI":"10.20965\/jaciii.2021.p0226","volume":"25","author":"Y Kingetsu","year":"2021","unstructured":"Kingetsu Y, Hamasuna Y. Jensen-Shannon divergence-based k-medoids clustering. J Adv Comput Intell Intell Inform. 2021;25(2):226\u201333.","journal-title":"J Adv Comput Intell Intell Inform"},{"key":"1227_CR104","unstructured":"Koch G, Zemel R, Salakhutdinov R. Siamese neural networks for one-shot image recognition. In ICML deep learning workshop. Lille. 2015;2: 0."},{"key":"1227_CR105","doi-asserted-by":"crossref","unstructured":"Kociumaka T, Porat E, Starikovskaya T. Small-space and streaming pattern matching with $$k$$ edits. In IEEE 62nd Annual Symposium on Foundations of Computer Science. 2022;885\u2013896.","DOI":"10.1109\/FOCS52979.2021.00090"},{"key":"1227_CR106","doi-asserted-by":"crossref","unstructured":"Kondrak G. N-gram similarity and distance. In International symposium on string processing and information retrieval. 2005;115\u2013126.","DOI":"10.1007\/11575832_13"},{"key":"1227_CR107","doi-asserted-by":"publisher","first-page":"65","DOI":"10.1016\/B978-0-12-814761-0.00004-6","volume-title":"Data science","author":"V Kotu","year":"2019","unstructured":"Kotu V, Deshpande B. Chapter 4 - Classification. In: Kotu V, Deshpande B, editors. Data science. 2nd ed. Burlington: Morgan Kaufmann; 2019. p. 65\u2013163.","edition":"2"},{"key":"1227_CR108","volume-title":"Taxicab geometry: an adventure in non-Euclidean Geometry","author":"EF Krause","year":"1986","unstructured":"Krause EF. Taxicab geometry: an adventure in non-Euclidean Geometry. Mineola: Dover Publication. Inc.; 1986."},{"key":"1227_CR109","first-page":"57","volume":"II","author":"S Kulczynski","year":"1927","unstructured":"Kulczynski S. Die pflanzenassoziationen der pieninen. Bull Int De l\u2019Acad Polonaise Des Sci Et Des Lett Classe Des Sci Math Et Nat, B Sci Nat. 1927;II:57\u2013203.","journal-title":"Bull Int De l\u2019Acad Polonaise Des Sci Et Des Lett Classe Des Sci Math Et Nat, B Sci Nat"},{"issue":"4","key":"1227_CR110","doi-asserted-by":"publisher","first-page":"287","DOI":"10.1561\/2200000019","volume":"5","author":"B Kulis","year":"2013","unstructured":"Kulis B. Metric learning: a survey. Found Trends Mach Learn. 2013;5(4):287\u2013364.","journal-title":"Found Trends Mach Learn"},{"key":"1227_CR111","doi-asserted-by":"publisher","first-page":"79","DOI":"10.1214\/aoms\/1177729694","volume":"22","author":"S Kullback","year":"1951","unstructured":"Kullback S, Leibler RA. On information and sufficiency. Ann Math Stat. 1951;22:79\u201386.","journal-title":"Ann Math Stat"},{"issue":"13","key":"1227_CR112","doi-asserted-by":"publisher","first-page":"597","DOI":"10.12988\/ijcms.2006.06063","volume":"1","author":"P Kumar","year":"2006","unstructured":"Kumar P, Taneja IJ. Generalized relative j-divergence measure and properties. Int J Contemp Math Sci. 2006;1(13):597\u2013609.","journal-title":"Int J Contemp Math Sci"},{"key":"1227_CR113","doi-asserted-by":"crossref","unstructured":"Kurniawan YI, Soviana E, Yuliana I. Merging pearson correlation and tan-elr algorithm in recommender system. In AIP Conference Proceedings. AIP Publishing. 2018;1977.","DOI":"10.1063\/1.5042998"},{"key":"1227_CR114","doi-asserted-by":"publisher","first-page":"60","DOI":"10.1093\/comjnl\/9.1.60","volume":"9","author":"GN Lance","year":"1966","unstructured":"Lance GN, Williams WT. Computer programs for hierarchical polythetic classification (\u201csimilarity analyses\u201d). Comput J. 1966;9:60\u20134.","journal-title":"Comput J"},{"issue":"4","key":"1227_CR115","doi-asserted-by":"publisher","first-page":"705","DOI":"10.1016\/j.ic.2010.12.006","volume":"209","author":"GM Landau","year":"2011","unstructured":"Landau GM, Levy A, Newman I. LCS approximation via embedding into locally non-repetitive strings. Inf Comput. 2011;209(4):705\u201316.","journal-title":"Inf Comput"},{"issue":"2","key":"1227_CR116","doi-asserted-by":"publisher","first-page":"338","DOI":"10.1006\/jagm.2001.1191","volume":"41","author":"GM Landau","year":"2001","unstructured":"Landau GM, Ziv-Ukelson M. On the common substring alignment problem. J Algorithm. 2001;41(2):338\u201359.","journal-title":"J Algorithm"},{"key":"1227_CR117","unstructured":"Law M, Liao R, Snell J, Zemel R. Lorentzian distance learning for hyperbolic representations. In Proc. of the 36th International Conference on Machine Learning. 2019;97:3672\u20133681."},{"key":"1227_CR118","doi-asserted-by":"crossref","unstructured":"Lee S. Improving jaccard index for measuring similarity in collaborative filtering. In Information Science and Applications 2017: ICISA 2017 8. Springer; 2017. 799\u2013806.","DOI":"10.1007\/978-981-10-4154-9_93"},{"key":"1227_CR119","first-page":"707","volume":"10","author":"VI Levenshtein","year":"1966","unstructured":"Levenshtein VI. Binary codes capable of correcting deletions, insertions and reversals. Soviet Phys Doklady. 1966;10:707\u201310.","journal-title":"Soviet Phys Doklady"},{"key":"1227_CR120","doi-asserted-by":"publisher","first-page":"102737","DOI":"10.1016\/j.ecoinf.2024.102737","volume":"82","author":"A Levy","year":"2024","unstructured":"Levy A, Barash A, Zaguri C, Hadad A, Polsky P. Improving deep learning based bluespotted ribbontail ray (taeniura lymma) recognition. Eco Inform. 2024;82:102737.","journal-title":"Eco Inform"},{"key":"1227_CR121","doi-asserted-by":"publisher","first-page":"150","DOI":"10.1016\/j.jesp.2017.09.011","volume":"74","author":"C Leys","year":"2018","unstructured":"Leys C, Klein O, Dominicy Y, Ley C. Detecting multivariate outliers: use a robust variant of the mahalanobis distance. J Exp Soc Psychol. 2018;74:150\u20136.","journal-title":"J Exp Soc Psychol"},{"issue":"2","key":"1227_CR122","doi-asserted-by":"publisher","first-page":"500","DOI":"10.3390\/sym15020500","volume":"15","author":"X Li","year":"2023","unstructured":"Li X, Liu Z, Han X, Liu N, Yuan W. An intuitionistic fuzzy version of hellinger distance measure and its application to decision-making process. Symmetry. 2023;15(2):500.","journal-title":"Symmetry"},{"issue":"5","key":"1227_CR123","first-page":"4197","volume":"35","author":"X Li","year":"2021","unstructured":"Li X, Li P. Rejection sampling for weighted Jaccard similarity revisited. Proc AAAI Conf Artif Intell. 2021;35(5):4197\u2013205.","journal-title":"Proc AAAI Conf Artif Intell"},{"issue":"9","key":"1227_CR124","doi-asserted-by":"publisher","first-page":"4489","DOI":"10.1016\/j.jfranklin.2022.03.037","volume":"359","author":"H Liang","year":"2022","unstructured":"Liang H, Zhao S, Li N. Multi-fidelity and learning-regularization for single image super resolution. J Franklin Inst. 2022;359(9):4489\u2013512.","journal-title":"J Franklin Inst"},{"key":"1227_CR125","doi-asserted-by":"publisher","first-page":"77","DOI":"10.1007\/s11047-020-09791-6","volume":"20","author":"J Liang","year":"2021","unstructured":"Liang J, Wei Y, Boyang Q, Yue C, Song H. Ensemble learning based on fitness Euclidean-distance ratio differential evolution for classification. Nat Comput. 2021;20:77\u201387.","journal-title":"Nat Comput"},{"key":"1227_CR126","unstructured":"Lin H-T, Li L. Novel distance-based svm kernels for infinite ensemble learning. In Proceedings of the 12th International Conference on Neural Information Processing. 2005;761\u2013766."},{"issue":"1","key":"1227_CR127","doi-asserted-by":"publisher","first-page":"145","DOI":"10.1109\/18.61115","volume":"37","author":"J Lin","year":"1991","unstructured":"Lin J. Divergence measures based on the Shannon entropy. IEEE Trans Inf Theory. 1991;37(1):145\u201351.","journal-title":"IEEE Trans Inf Theory"},{"issue":"9","key":"1227_CR128","doi-asserted-by":"publisher","first-page":"1020","DOI":"10.1016\/j.ic.2010.04.001","volume":"208","author":"O Lipsky","year":"2010","unstructured":"Lipsky O, Porat B, Porat E, Shalom BR, Tsur D. String matching with up to k swaps and mismatches. Inf Comput. 2010;208(9):1020\u201330.","journal-title":"Inf Comput"},{"key":"1227_CR129","doi-asserted-by":"crossref","unstructured":"Liu K, Brand L, Wang H, Nie F. Learning robust distance metric with side information via ratio minimization of orthogonally constrained L2-norm distances. In Proc. of the 28th International Joint Conference on Artificial Intelligence. 2019;3008\u20133014.","DOI":"10.24963\/ijcai.2019\/417"},{"key":"1227_CR130","doi-asserted-by":"crossref","unstructured":"Liu Z, Hu W. Fsm: A fast similarity measurement for gene regulatory networks via genes\u2019 influence power. In Proc. of the 28th International Joint Conference on Artificial Intelligence. 2019;4547\u20134553.","DOI":"10.24963\/ijcai.2019\/632"},{"key":"1227_CR131","doi-asserted-by":"publisher","first-page":"409","DOI":"10.2307\/1933315","volume":"41","author":"J Looman","year":"1960","unstructured":"Looman J, Campbell JB. Adaptation of sorensen\u2019s K (1948) for estimating unit affinities in prairie vegetation. Ecology. 1960;41:409\u201316.","journal-title":"Ecology"},{"key":"1227_CR132","doi-asserted-by":"crossref","unstructured":"Lv W, Huang H, Tang W, Chen T. Research and application of intersection similarity algorithm based on knn classification model. In 2021 International Conference on Artificial Intelligence, Big Data and Algorithms (CAIBDA). 2021;141\u2013144.","DOI":"10.1109\/CAIBDA53561.2021.00037"},{"key":"1227_CR133","unstructured":"Macklem M. Multidimensional modelling of image fidelity measures. M.\u00a0sc.\u00a0dissertation, Simon Fraser University, 2002."},{"key":"1227_CR134","first-page":"541","volume":"26","author":"PC Mahalanobis","year":"1930","unstructured":"Mahalanobis PC. On tests and measures of groups divergence. J Asiatic Sociol Bengal. 1930;26:541\u201388.","journal-title":"J Asiatic Sociol Bengal"},{"key":"1227_CR135","doi-asserted-by":"publisher","first-page":"012080","DOI":"10.1088\/1742-6596\/1450\/1\/012080","volume":"1450","author":"E Maria","year":"2020","unstructured":"Maria E, Budiman E, Taruk M, et al. Measure distance locating nearest public facilities using haversine and Euclidean methods. J Phys Conf Ser. 2020;1450:012080.","journal-title":"J Phys Conf Ser"},{"issue":"4","key":"1227_CR136","doi-asserted-by":"publisher","first-page":"631","DOI":"10.1214\/aoms\/1177728422","volume":"26","author":"K Matusita","year":"1955","unstructured":"Matusita K. Decision rules based on the distance for problems of fit, two samples and estimation. Ann Math Stat. 1955;26(4):631\u201340.","journal-title":"Ann Math Stat"},{"key":"1227_CR137","unstructured":"McCaffrey JD. Calculating the mahalanobis distance. https:\/\/jamesmccaffrey.wordpress.com\/2017\/11\/09, 2017."},{"key":"1227_CR138","doi-asserted-by":"publisher","first-page":"135","DOI":"10.1016\/j.ins.2019.09.027","volume":"510","author":"J McCulloch","year":"2020","unstructured":"McCulloch J, Wagner C. On the choice of similarity measures for type-2 fuzzy sets. Inf Sci. 2020;510:135\u201354. https:\/\/doi.org\/10.1016\/j.ins.2019.09.027.","journal-title":"Inf Sci"},{"key":"1227_CR139","doi-asserted-by":"publisher","first-page":"143","DOI":"10.11613\/BM.2013.018","volume":"23","author":"ML McHugh","year":"2013","unstructured":"McHugh ML. The Chi-square test of independence. Biochem Med. 2013;23:143\u20139.","journal-title":"Biochem Med"},{"key":"1227_CR140","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1007\/BF02834632","volume":"4","author":"GJ McLachlan","year":"1999","unstructured":"McLachlan GJ. Mahalanobis distance. Resonance. 1999;4:20\u20136.","journal-title":"Resonance"},{"key":"1227_CR141","unstructured":"Motyka J, Dobrzanski B, Zawadzki S. Preliminary studies on meadows in the south-east of lublin province. Ann Univ Mariae Curie-Sklodowska 5E. 1950;367\u2013447."},{"key":"1227_CR142","volume-title":"Encyclopedia of social network analysis and mining","author":"MS Mulekar","year":"2018","unstructured":"Mulekar MS, Brown CS. Distance and similarity measures. In: Alhajj R, Rokne JG, editors. Encyclopedia of social network analysis and mining. 2nd ed. Berlin: Springer; 2018.","edition":"2"},{"issue":"3","key":"1227_CR143","doi-asserted-by":"publisher","first-page":"443","DOI":"10.1016\/0022-2836(70)90057-4","volume":"48","author":"SB Needleman","year":"1970","unstructured":"Needleman SB, Wunsch CD. A general method applicable to the search for similarities in the amino acid sequence of two proteins. J Mol Biol. 1970;48(3):443\u201353.","journal-title":"J Mol Biol"},{"key":"1227_CR144","unstructured":"Neyman J. Contributions to the theory of the $$\\chi ^2$$ test. In Proc. the First Berkley Symposium on Mathematical Statistics and Probability. 1949."},{"key":"1227_CR145","unstructured":"Nickel M, Kiela D. Learning continuous hierarchies in the lorentz model of hyperbolic geometry. In International Conference on Machine Learning. PMLR. 2018;3779\u20133788."},{"issue":"5","key":"1227_CR146","doi-asserted-by":"publisher","first-page":"485","DOI":"10.3390\/e21050485","volume":"21","author":"F Nielsen","year":"2019","unstructured":"Nielsen F. On the Jensen-Shannon symmetrization of distances relying on abstract means. Entropy. 2019;21(5):485.","journal-title":"Entropy"},{"issue":"2","key":"1227_CR147","doi-asserted-by":"publisher","first-page":"221","DOI":"10.3390\/e22020221","volume":"22","author":"F Nielsen","year":"2020","unstructured":"Nielsen F. On a generalization of the Jensen-Shannon divergence and the Jensen-Shannon centroid. Entropy. 2020;22(2):221.","journal-title":"Entropy"},{"issue":"3","key":"1227_CR148","doi-asserted-by":"publisher","first-page":"731","DOI":"10.1007\/s00500-014-1296-7","volume":"19","author":"F Noorbehbahani","year":"2015","unstructured":"Noorbehbahani F, Mousavi SR, Mirzaei A. An incremental mixed data clustering method using a new distance measure. Soft Comput. 2015;19(3):731\u201343.","journal-title":"Soft Comput"},{"issue":"1","key":"1227_CR149","doi-asserted-by":"publisher","first-page":"87","DOI":"10.1016\/0033-5894(85)90074-2","volume":"23","author":"JT Overpeck","year":"1985","unstructured":"Overpeck JT, Webb T, Prentice IC. Quantitative interpretation of fossil pollen spectra: dissimilarity coefficients and the method of modern analogs. Quat Res. 1985;23(1):87\u2013108.","journal-title":"Quat Res"},{"key":"1227_CR150","doi-asserted-by":"crossref","unstructured":"Papineni K, Roukos S, Ward T, Zhu W-J. Bleu: a method for automatic evaluation of machine translation. In Proc. of the 40th annual meeting of the Association for Computational Linguistics. 2002;311\u2013318.","DOI":"10.3115\/1073083.1073135"},{"key":"1227_CR151","doi-asserted-by":"publisher","first-page":"122435","DOI":"10.1016\/j.eswa.2023.122435","volume":"239","author":"G Park","year":"2024","unstructured":"Park G, Cho M, Lee J. Leveraging machine learning for automatic topic discovery and forecasting of process mining research: a literature review. Expert Syst Appl. 2024;239:122435.","journal-title":"Expert Syst Appl"},{"key":"1227_CR152","doi-asserted-by":"publisher","first-page":"157","DOI":"10.1080\/14786440009463897","volume":"50","author":"K Pearson","year":"1900","unstructured":"Pearson K. On the criterion that a given system of deviations from the probable in the case of correlated system of variables is such that it can be reasonable supposed to have arisen from random sampling. Phil Mag. 1900;50:157\u201372.","journal-title":"Phil Mag"},{"key":"1227_CR153","doi-asserted-by":"crossref","unstructured":"Podolskiy AV, Lipin D, Bout A, Artemova E, Piontkovskaya I. Revisiting mahalanobis distance for transformer-based out-of-domain detection. In Proc. AAAI Conference on Artifical Intelligence. 2021;13675\u201313682.","DOI":"10.1609\/aaai.v35i15.17612"},{"key":"1227_CR154","doi-asserted-by":"publisher","first-page":"106776","DOI":"10.1016\/j.cmpb.2022.106776","volume":"219","author":"R Pramanik","year":"2022","unstructured":"Pramanik R, Biswas M, Sen S, de Souza LA, Papa JP, Sarkar R. A fuzzy distance-based ensemble of deep models for cervical cancer detection. Comput Methods Progr Biomed. 2022;219:106776.","journal-title":"Comput Methods Progr Biomed"},{"key":"1227_CR155","doi-asserted-by":"publisher","first-page":"77","DOI":"10.1016\/j.anbehav.2015.01.010","volume":"102","author":"M-T Puth","year":"2015","unstructured":"Puth M-T, Neuh\u00e4user M, Ruxton GD. Effective use of spearman\u2019s and Kendall\u2019s correlation coefficients for association between two measured traits. Animal Behav. 2015;102:77\u201384.","journal-title":"Animal Behav"},{"issue":"8","key":"1227_CR156","doi-asserted-by":"publisher","first-page":"2741","DOI":"10.1109\/TNNLS.2019.2929575","volume":"31","author":"Y Qiao","year":"2020","unstructured":"Qiao Y, Yuewei W, Duo F, Lin W, Yang J. Siamese neural networks for user identity linkage through web browsing. IEEE Trans Neural Netw Learn Syst. 2020;31(8):2741\u201351.","journal-title":"IEEE Trans Neural Netw Learn Syst"},{"key":"1227_CR157","doi-asserted-by":"publisher","first-page":"46","DOI":"10.1016\/j.neucom.2020.04.125","volume":"409","author":"Q Qin","year":"2020","unstructured":"Qin Q, Huang L, Wei Z. Deep multilevel similarity hashing with fine-grained features for multi-label image retrieval. Neurocomputing. 2020;409:46\u201359.","journal-title":"Neurocomputing"},{"key":"1227_CR158","doi-asserted-by":"crossref","unstructured":"Rahman Z, Hussain A, Shah H, Arshad M, et\u00a0al. Urdu news clustering using k-mean algorithm on the basis of jaccard coefficient and dice coefficient similarity. 2022.","DOI":"10.14201\/ADCAIJ2021104381399"},{"key":"1227_CR159","doi-asserted-by":"crossref","unstructured":"Raiber F, Kurland O. Kullback-leibler divergence revisited. In Proceedings of the ACM SIGIR international conference on theory of information retrieval. 2017;117\u2013124.","DOI":"10.1145\/3121050.3121062"},{"key":"1227_CR160","first-page":"23","volume":"19","author":"CR Rao","year":"1995","unstructured":"Rao CR. A review of canonical coordinates and an alternative to correspondence analysis using hellinger distance. Q\u00fcestii\u00f3 Quaderns D\u2019estad\u00edstica i Investigaci\u00f3 Operativa. 1995;19:23.","journal-title":"Q\u00fcestii\u00f3 Quaderns D\u2019estad\u00edstica i Investigaci\u00f3 Operativa"},{"key":"1227_CR161","doi-asserted-by":"publisher","first-page":"66","DOI":"10.1016\/j.patrec.2018.03.021","volume":"110","author":"\u00c9O Rodrigues","year":"2018","unstructured":"Rodrigues \u00c9O. Combining minkowski and chebyshev: New distance proposal and survey of distance metrics using k-nearest neighbours classifier. Pattern Recogn Lett. 2018;110:66\u201371.","journal-title":"Pattern Recogn Lett"},{"key":"1227_CR162","unstructured":"Rosenfeld A. Better metrics for evaluating explainable artificial intelligence. In Proc. of the 20th international conference on autonomous agents and multiagent systems. 2021;45\u201350."},{"key":"1227_CR163","doi-asserted-by":"crossref","unstructured":"Roth K, Brattoli B, Ommer B. Mic: Mining interclass characteristics for improved metric learning. In Proc. of the IEEE\/CVF International Conference on Computer Vision. 2019;8000\u20138009.","DOI":"10.1109\/ICCV.2019.00809"},{"key":"1227_CR164","volume-title":"Information science and statistics","author":"RY Rubinstein","year":"2004","unstructured":"Rubinstein RY, Kroese DP. The cross-entropy method: a unified approach to combinatorial optimization, Monte-Carlo simulation and machine learning. In: Rubinstein RY, Kroese DP, editors. Information science and statistics. 1st ed. New York: Springer; 2004.","edition":"1"},{"key":"1227_CR165","first-page":"647","volume":"13","author":"M Ruzicka","year":"1958","unstructured":"Ruzicka M. Anwendung mathematisch-statistiker methoden in geobotanik (synthetische bearbeitung von aufnahmen). Biologia. 1958;13:647\u201361.","journal-title":"Biologia"},{"issue":"5","key":"1227_CR166","doi-asserted-by":"publisher","first-page":"1763","DOI":"10.1213\/ANE.0000000000002864","volume":"126","author":"P Schober","year":"2018","unstructured":"Schober P, Boer C, Schwarte LA. Correlation coefficients: appropriate use and interpretation. Anesth Analg. 2018;126(5):1763\u20138.","journal-title":"Anesth Analg"},{"issue":"5","key":"1227_CR167","doi-asserted-by":"publisher","first-page":"271","DOI":"10.3390\/info14050271","volume":"14","author":"B Shade","year":"2023","unstructured":"Shade B, Altmann EG. Quantifying the dissimilarity of texts. Information. 2023;14(5):271.","journal-title":"Information"},{"key":"1227_CR168","doi-asserted-by":"crossref","unstructured":"Shapira D, Storer JA. Large edit distance with multiple block operations. In String Processing and Information Retrieval: 10th International Symposium, SPIRE 2003, Manaus, Brazil, October 8-10, 2003. Proceedings 10. Springer. 2003;369\u2013377.","DOI":"10.1007\/978-3-540-39984-1_29"},{"issue":"10","key":"1227_CR169","doi-asserted-by":"publisher","first-page":"1537","DOI":"10.1016\/j.neunet.2008.07.001","volume":"21","author":"F Shen","year":"2008","unstructured":"Shen F, Hasegawa O. A fast nearest neighbor classifier based on self-organizing incremental neural network. Neural Netw. 2008;21(10):1537\u201347.","journal-title":"Neural Netw"},{"key":"1227_CR170","doi-asserted-by":"publisher","first-page":"329","DOI":"10.1007\/s40031-020-00501-5","volume":"102","author":"R Singh","year":"2021","unstructured":"Singh R, Singh S. Text similarity measures in news articles by vector space model using nlp. J Inst Eng (India) Ser B. 2021;102:329\u201338.","journal-title":"J Inst Eng (India) Ser B"},{"key":"1227_CR171","doi-asserted-by":"publisher","first-page":"195","DOI":"10.1016\/0022-2836(81)90087-5","volume":"147","author":"TF Smith","year":"1981","unstructured":"Smith TF, Waterman MS. Identification of common molecular subsequences. J Mol Biol. 1981;147:195\u20137.","journal-title":"J Mol Biol"},{"key":"1227_CR172","doi-asserted-by":"publisher","first-page":"129","DOI":"10.1016\/0020-0271(67)90006-X","volume":"3","author":"D Soergel","year":"1967","unstructured":"Soergel D. Mathematical analysis of documentation systems. Inf Storage Retr. 1967;3:129\u201373.","journal-title":"Inf Storage Retr"},{"issue":"6","key":"1227_CR173","doi-asserted-by":"publisher","first-page":"1985","DOI":"10.1007\/s00500-017-2912-0","volume":"23","author":"Y Song","year":"2019","unstructured":"Song Y, Wang X, Quan W, Huang W. A new approach to construct similarity measure for intuitionistic fuzzy sets. Soft Comput. 2019;23(6):1985\u201398.","journal-title":"Soft Comput"},{"issue":"4","key":"1227_CR174","first-page":"1","volume":"5","author":"T S\u00f8rensen","year":"1948","unstructured":"S\u00f8rensen T. A method of establishing groups of equal amplitude in plant sociology based on similarity of species and its application to analyses of the vegetation on Danish commons. Kongelige Danske Videnskabernes Selskab. 1948;5(4):1\u201334.","journal-title":"Kongelige Danske Videnskabernes Selskab"},{"issue":"1","key":"1227_CR175","doi-asserted-by":"publisher","first-page":"72","DOI":"10.2307\/1412159","volume":"15","author":"CE Spearman","year":"1904","unstructured":"Spearman CE. The proof and measurement of association between two things. Am J Psychol. 1904;15(1):72\u2013101.","journal-title":"Am J Psychol"},{"issue":"1","key":"1227_CR176","doi-asserted-by":"publisher","first-page":"261","DOI":"10.1186\/s13643-024-02680-4","volume":"13","author":"LM Spineli","year":"2024","unstructured":"Spineli LM. Local inconsistency detection using the Kullback-Leibler divergence measure. Syst Rev. 2024;13(1):261.","journal-title":"Syst Rev"},{"key":"1227_CR177","doi-asserted-by":"crossref","unstructured":"Steck H, Ekanadham C, Kallus N. Is cosine-similarity of embeddings really about similarity? In Companion Proceedings of the ACM Web Conference 2024. 2024;887\u201390.","DOI":"10.1145\/3589335.3651526"},{"issue":"7772","key":"1227_CR178","doi-asserted-by":"publisher","first-page":"117","DOI":"10.1038\/s41586-019-1507-6","volume":"573","author":"AJ Stewart","year":"2019","unstructured":"Stewart AJ, Mosleh M, Diakonova M, Arechar AA, Rand DG, Plotkin JB. Information gerrymandering and undemocratic decisions. Nature. 2019;573(7772):117\u201321.","journal-title":"Nature"},{"key":"1227_CR179","doi-asserted-by":"crossref","unstructured":"Sun Y, Wang X, Tang X. Deep learning face representation from predicting 10,000 classes. In Proc.of the IEEE conference on computer vision and pattern recognition. 2014;1891\u20131898.","DOI":"10.1109\/CVPR.2014.244"},{"issue":"1","key":"1227_CR180","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1007\/BF00130487","volume":"7","author":"MJ Swain","year":"1991","unstructured":"Swain MJ, Ballard DH. Color indexing. Int J Comput Vision. 1991;7(1):11\u201332.","journal-title":"Int J Comput Vision"},{"key":"1227_CR181","doi-asserted-by":"crossref","unstructured":"S\u00e1nchez DL, Corchado JM, S\u00e1nchez AGAL, Corchado JM, Arrieta AG. Inhibition of occluded facial regions for distance-based face recognition. In Proc. of the 27th International Joint Conference on Artificial Intelligence. 2018;5324\u20135328.","DOI":"10.24963\/ijcai.2018\/746"},{"key":"1227_CR182","doi-asserted-by":"crossref","unstructured":"Taigman Y, Yang M, Ranzato M, Wolf L. Deepface: Closing the gap to human-level performance in face verification. In Proc. of the IEEE conference on computer vision and pattern recognition. 2014;1701\u20131708.","DOI":"10.1109\/CVPR.2014.220"},{"key":"1227_CR183","volume-title":"Descriptive physical oceanography","author":"LD Talley","year":"2011","unstructured":"Talley LD, Pickard GL, Emery WJ, Swift JH. Descriptive physical oceanography. 6th ed. Boston: Academic Press; 2011.","edition":"6"},{"key":"1227_CR184","doi-asserted-by":"publisher","first-page":"327","DOI":"10.1016\/S0065-2539(08)60580-6","volume-title":"Advances in electronics and electron physics","author":"IJ Taneja","year":"1989","unstructured":"Taneja IJ. On generalized information measures and their applications. In: Hawkes PW, editor. Advances in electronics and electron physics. Cambridge: Academic Press; 1989. p. 327\u2013413."},{"key":"1227_CR185","volume-title":"An elementary mathematical theory of classification and prediction","author":"TT Tanimoto","year":"1958","unstructured":"Tanimoto TT. An elementary mathematical theory of classification and prediction. New York: International Business Machines Corporation; 1958."},{"key":"1227_CR186","doi-asserted-by":"publisher","first-page":"122644","DOI":"10.1016\/j.eswa.2023.122644","volume":"244","author":"TH Teng","year":"2024","unstructured":"Teng TH, Varathan KD, Crestani F. A comprehensive review of cyberbullying-related content classification in online social media. Expert Syst Appl. 2024;244:122644.","journal-title":"Expert Syst Appl"},{"key":"1227_CR187","unstructured":"Tessari F, Yao K, Hogan N. Surpassing cosine similarity for multidimensional comparisons: Dimension insensitive euclidean metric (diem), 2024."},{"key":"1227_CR188","doi-asserted-by":"crossref","unstructured":"Tian Y, Fan B, Wu F. L2-net: Deep learning of discriminative patch descriptor in Euclidean space. In IEEE Conference on Computer Vision and Pattern Recognition. 2017;6128\u20136136.","DOI":"10.1109\/CVPR.2017.649"},{"issue":"12","key":"1227_CR189","first-page":"1","volume":"21","author":"X Tong","year":"2020","unstructured":"Tong X, Xia L, Wang J, Feng Y. Neyman-Pearson classification: parametrics and sample size requirement. J Mach Learn Res. 2020;21(12):1\u201348.","journal-title":"J Mach Learn Res"},{"issue":"4","key":"1227_CR190","doi-asserted-by":"publisher","first-page":"1602","DOI":"10.1109\/18.850703","volume":"46","author":"F Tops\u00f8e","year":"2000","unstructured":"Tops\u00f8e F. Some inequalities for information divergence and related measures of discrimination. IEEE Trans Inf Theory. 2000;46(4):1602\u20139.","journal-title":"IEEE Trans Inf Theory"},{"issue":"2","key":"1227_CR191","doi-asserted-by":"publisher","first-page":"275","DOI":"10.1109\/PROC.1977.10469","volume":"65","author":"GT Toussaint","year":"1977","unstructured":"Toussaint GT. An upper bound on the probability of misclassification in terms of the affinity. Proc IEEE. 1977;65(2):275\u20136.","journal-title":"Proc IEEE"},{"issue":"1","key":"1227_CR192","doi-asserted-by":"publisher","first-page":"233","DOI":"10.1186\/s12859-022-04769-w","volume":"23","author":"A Ultsch","year":"2022","unstructured":"Ultsch A, L\u00f6tsch J. Euclidean distance-optimized data transformation for cluster analysis in biomedical data (edotrans). BMC Bioinform. 2022;23(1):233.","journal-title":"BMC Bioinform"},{"key":"1227_CR193","doi-asserted-by":"publisher","DOI":"10.1002\/9780470974414","volume-title":"Statistical methods for fuzzy data","author":"R Viertl","year":"2011","unstructured":"Viertl R. Statistical methods for fuzzy data. Hoboken: John Wiley & Sons; 2011."},{"issue":"2","key":"1227_CR194","doi-asserted-by":"publisher","first-page":"165","DOI":"10.1214\/aoms\/1177730030","volume":"20","author":"A Wald","year":"1949","unstructured":"Wald A. Statistical decision functions. Ann Math Stat. 1949;20(2):165\u2013205.","journal-title":"Ann Math Stat"},{"key":"1227_CR195","doi-asserted-by":"publisher","first-page":"215","DOI":"10.1016\/j.neucom.2020.10.081","volume":"429","author":"M Wang","year":"2021","unstructured":"Wang M, Deng W. Deep face recognition: a survey. Neurocomputing. 2021;429:215\u201344.","journal-title":"Neurocomputing"},{"key":"1227_CR196","first-page":"10201","volume":"35","author":"S Wang","year":"2021","unstructured":"Wang S, Eykholt K, Lee T, Jang J, Molloy I. Adaptive verifiable training using pairwise class similarity. Proc AAAI Conf Artif Intell. 2021;35:10201\u20139.","journal-title":"Proc AAAI Conf Artif Intell"},{"key":"1227_CR197","doi-asserted-by":"crossref","unstructured":"Wang X, Han X, Huang W, Dong D, Scott MR. Multi-similarity loss with general pair weighting for deep metric learning. In Proc. of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 2019;5022\u20135030.","DOI":"10.1109\/CVPR.2019.00516"},{"key":"1227_CR198","doi-asserted-by":"crossref","unstructured":"Wang Y, Wu S, Jiang W, Hao S, Tan Y, Zhang Q. Demiguise attack: Crafting invisible semantic adversarial perturbations with perceptual similarity. In Proc. of the 30th International Joint Conference on Artificial Intelligence. 2021;3125\u20133133.","DOI":"10.24963\/ijcai.2021\/430"},{"key":"1227_CR199","doi-asserted-by":"publisher","first-page":"983","DOI":"10.1021\/ci9800211","volume":"38","author":"P Willett","year":"1998","unstructured":"Willett P, Barnard JM, Downs GM. Chemical similarity searching. J Chem Inform Comput Sci. 1998;38:983\u201396.","journal-title":"J Chem Inform Comput Sci"},{"key":"1227_CR200","unstructured":"Winkler WE. String comparator metrics and enhanced decision rules in the Fellegi-Sunter model of record linkage. In Proc of the Section on Survey Research. 1990;354\u2013359."},{"issue":"2","key":"1227_CR201","doi-asserted-by":"publisher","first-page":"241","DOI":"10.1016\/S0893-6080(05)80023-1","volume":"5","author":"DH Wolpert","year":"1992","unstructured":"Wolpert DH. Stacked generalization. Neural Netw. 1992;5(2):241\u201359.","journal-title":"Neural Netw"},{"key":"1227_CR202","doi-asserted-by":"crossref","unstructured":"Wu C-Y, Manmatha R, Smola AJ, Krahenbuhl P. Sampling matters in deep embedding learning. In Proc of the IEEE International Conference on Computer Vision. 2017;2840\u20132848.","DOI":"10.1109\/ICCV.2017.309"},{"issue":"7","key":"1227_CR203","doi-asserted-by":"publisher","first-page":"1373","DOI":"10.3390\/f14071373","volume":"14","author":"F Xu","year":"2023","unstructured":"Xu F, Xu Z, Xu C, Yu T. Automatic extraction of the spatial distribution of Picea Schrenkiana in the Tianshan mountains based on google earth engine and the Jeffries-Matusita distance. Forests. 2023;14(7):1373.","journal-title":"Forests"},{"key":"1227_CR204","doi-asserted-by":"crossref","unstructured":"Xu J, Luo L, Deng C, Huang H. Multi-level metric learning via smoothed wasserstein distance. In Proc. of the 27th International Joint Conference on Artificial Intelligence. 2018;2919\u20132925.","DOI":"10.24963\/ijcai.2018\/405"},{"key":"1227_CR205","doi-asserted-by":"publisher","first-page":"13","DOI":"10.1016\/j.eswa.2016.01.035","volume":"54","author":"X Jingxin","year":"2016","unstructured":"Jingxin X, Denman S, Fookes C, Sridharan S. Detecting rare events using Kullback-Leibler divergence: a weakly supervised approach. Expert Syst Appl. 2016;54:13\u201328.","journal-title":"Expert Syst Appl"},{"key":"1227_CR206","doi-asserted-by":"crossref","unstructured":"Yang E, Deng C, Liu T, Liu W, Tao D. Semantic structure-based unsupervised deep hashing. In Proc. of the 27th international joint conference on artificial intelligence. 2018;1064\u20131070.","DOI":"10.24963\/ijcai.2018\/148"},{"issue":"4","key":"1227_CR207","first-page":"4901","volume":"38","author":"S Yin","year":"2020","unstructured":"Yin S, Wang T. An unknown protocol improved k-means clustering algorithm based on Pearson distance. J Intell Fuzzy Syst. 2020;38(4):4901\u201313.","journal-title":"J Intell Fuzzy Syst"},{"key":"1227_CR208","doi-asserted-by":"crossref","unstructured":"Yu Z, Cao R, Tang Q, Nie S, Huang J, Wu S. Order matters: Semantic-aware neural networks for binary code similarity detection. In Proc. of the AAAI Conference on Artificial Intelligence. 2020;1145\u20131152.","DOI":"10.1609\/aaai.v34i01.5466"},{"key":"1227_CR209","doi-asserted-by":"crossref","unstructured":"Zakani FR, Arhid K, Bouksim M, Gadi T, Aboulfatah M. Kulczynski similarity index for objective evaluation of mesh segmentation algorithms. In 2016 5th International Conference on Multimedia Computing and Systems (ICMCS). 2016;12\u201317.","DOI":"10.1109\/ICMCS.2016.7905611"},{"issue":"1","key":"1227_CR210","doi-asserted-by":"publisher","first-page":"012103","DOI":"10.1088\/1742-6596\/1566\/1\/012103","volume":"1566","author":"N Zendrato","year":"2020","unstructured":"Zendrato N, Dhany HW, Siagian NA, Izhari F. Bigdata clustering using x-means method with Euclidean distance. J Phys Conf Ser. 2020;1566(1):012103.","journal-title":"J Phys Conf Ser"},{"issue":"8","key":"1227_CR211","doi-asserted-by":"publisher","first-page":"5790","DOI":"10.1109\/TII.2020.3047675","volume":"17","author":"X Zhou","year":"2021","unstructured":"Zhou X, Liang W, Shimizu S, Ma J, Jin Q. Siamese neural network based few-shot learning for anomaly detection in industrial cyber-physical systems. IEEE Trans Industr Inf. 2021;17(8):5790\u20138.","journal-title":"IEEE Trans Industr Inf"},{"issue":"2","key":"1227_CR212","doi-asserted-by":"publisher","first-page":"221","DOI":"10.1016\/0888-613X(87)90015-6","volume":"1","author":"R Zwick","year":"1987","unstructured":"Zwick R, Carlstein E, Budescu DV. Measures of similarity among fuzzy concepts: a comparative analysis. Int J Approx Reason. 1987;1(2):221\u201342.","journal-title":"Int J Approx Reason"}],"container-title":["Journal of Big Data"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s40537-025-01227-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s40537-025-01227-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s40537-025-01227-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,8]],"date-time":"2025-09-08T05:26:25Z","timestamp":1757309185000},"score":1,"resource":{"primary":{"URL":"https:\/\/journalofbigdata.springeropen.com\/articles\/10.1186\/s40537-025-01227-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,7,26]]},"references-count":212,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2025,12]]}},"alternative-id":["1227"],"URL":"https:\/\/doi.org\/10.1186\/s40537-025-01227-1","relation":{},"ISSN":["2196-1115"],"issn-type":[{"value":"2196-1115","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,7,26]]},"assertion":[{"value":"1 December 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"21 June 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 July 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"Not applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"The authors have no competing interests as defined by Springer, or other interests that might be perceived to influence the results and\/or discussion reported in this paper.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"188"}}