{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,16]],"date-time":"2025-10-16T07:02:10Z","timestamp":1760598130620,"version":"3.37.3"},"reference-count":37,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2022,2,17]],"date-time":"2022-02-17T00:00:00Z","timestamp":1645056000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,2,17]],"date-time":"2022-02-17T00:00:00Z","timestamp":1645056000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Knowl Inf Syst"],"published-print":{"date-parts":[[2022,3]]},"DOI":"10.1007\/s10115-022-01658-9","type":"journal-article","created":{"date-parts":[[2022,2,17]],"date-time":"2022-02-17T05:02:33Z","timestamp":1645074153000},"page":"723-742","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":7,"title":["Postimpact similarity: a similarity measure for effective grouping of unlabelled text using spectral clustering"],"prefix":"10.1007","volume":"64","author":[{"given":"Arnab Kumar","family":"Roy","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9536-8075","authenticated-orcid":false,"given":"Tanmay","family":"Basu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,2,17]]},"reference":[{"issue":"6","key":"1658_CR1","doi-asserted-by":"publisher","first-page":"601","DOI":"10.1109\/TSMCC.2010.2053532","volume":"40","author":"C Romero","year":"2010","unstructured":"Romero C, Ventura S (2010) Educational data mining: a review of the state of the art. IEEE Trans Syst Man Cybern Part C 40(6):601\u2013618","journal-title":"IEEE Trans Syst Man Cybern Part C"},{"key":"1658_CR2","doi-asserted-by":"crossref","unstructured":"Xu Z, Ke Y (2016) Effective and efficient spectral clustering on text and link data. In: Proceedings of ACM international conference on information and knowledge management. pp 357\u2013366","DOI":"10.1145\/2983323.2983708"},{"key":"1658_CR3","unstructured":"Shaham U, Stanton K, Li H, Nadler B, Basri R, Kluger Y (2018) Spectralnet: spectral clustering using deep neural networks. In: Proceedings of international conference on learning representations"},{"key":"1658_CR4","doi-asserted-by":"publisher","first-page":"192","DOI":"10.1016\/j.eswa.2019.05.030","volume":"134","author":"R Janani","year":"2019","unstructured":"Janani R, Vijayarani S (2019) Text document clustering using spectral clustering algorithm with particle swarm optimization. Expert Syst Appl 134:192\u2013200","journal-title":"Expert Syst Appl"},{"key":"1658_CR5","doi-asserted-by":"publisher","first-page":"149","DOI":"10.1016\/j.ins.2015.03.038","volume":"311","author":"T Basu","year":"2015","unstructured":"Basu T, Murthy CA (2015) A similarity assessment technique for effective grouping of documents. Inf Sci 311:149\u2013162","journal-title":"Inf Sci"},{"issue":"6","key":"1658_CR6","doi-asserted-by":"publisher","first-page":"532","DOI":"10.1006\/cgip.1993.1040","volume":"55","author":"CA Glasbey","year":"1993","unstructured":"Glasbey CA (1993) An analysis of histogram-based thresholding algorithms. CVGIP Graph Models Image Process 55(6):532\u2013537","journal-title":"CVGIP Graph Models Image Process"},{"key":"1658_CR7","unstructured":"Ng AY, Jordan MI, Weiss Y (2002) On spectral clustering: analysis and an algorithm. In: Advances in neural information processing systems. pp 849\u2013856"},{"issue":"9","key":"1658_CR8","doi-asserted-by":"publisher","first-page":"1066","DOI":"10.3390\/sym11091066","volume":"11","author":"M Kaya","year":"2019","unstructured":"Kaya M, Bilge H\u015e (2019) Deep metric learning: a survey. Symmetry 11(9):1066","journal-title":"Symmetry"},{"key":"1658_CR9","doi-asserted-by":"crossref","unstructured":"Davis JV, Kulis B, Jain P, Sra S, Dhillon IS (2007) Information-theoretic metric learning. In: Proceedings of international conference on machine learning. pp 209\u2013216","DOI":"10.1145\/1273496.1273523"},{"issue":"2","key":"1658_CR10","first-page":"207","volume":"10","author":"KQ Weinberger","year":"2009","unstructured":"Weinberger KQ, Saul LK (2009) Distance metric learning for large margin nearest neighbor classification. J Mach Learn Res 10(2):207","journal-title":"J Mach Learn Res"},{"issue":"4","key":"1658_CR11","doi-asserted-by":"publisher","first-page":"287","DOI":"10.1561\/2200000019","volume":"5","author":"B Kulis","year":"2012","unstructured":"Kulis B et al (2012) Metric learning: a survey. Found Trends Mach Learn 5(4):287\u2013364","journal-title":"Found Trends Mach Learn"},{"key":"1658_CR12","doi-asserted-by":"crossref","unstructured":"Dai G, Xie J, Zhu F, Fang Y (2017) Deep correlated metric learning for sketch-based 3d shape retrieval. In: Proceedings of AAAI conference on artificial intelligence","DOI":"10.1109\/TIP.2018.2817042"},{"key":"1658_CR13","doi-asserted-by":"crossref","unstructured":"Harwood B, Kumar\u00a0BGV, Carneiro G, Reid I, Drummond T (2017) Smart mining for deep metric learning. In: Proceedings of the IEEE international conference on computer vision. pp 2821\u20132829","DOI":"10.1109\/ICCV.2017.307"},{"key":"1658_CR14","unstructured":"Strehl A, Ghosh J, Mooney R (2000) Impact of similarity measures on web-page clustering. In: Workshop on artificial intelligence for web search. 58:64"},{"key":"1658_CR15","unstructured":"Huang A (2008) Similarity measures for text document clustering. In: Proceedings of the New Zealand computer science research student conference, Christchurch, New Zealand. pp 49\u201356"},{"issue":"1","key":"1658_CR16","doi-asserted-by":"publisher","first-page":"66","DOI":"10.13176\/11.459","volume":"8","author":"T Basu","year":"2013","unstructured":"Basu T, Murthy CA (2013) Cues: a new hierarchical approach for document clustering. J Pattern Recognit Res 8(1):66\u201384","journal-title":"J Pattern Recognit Res"},{"key":"1658_CR17","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-13-7403-6_9","author":"A Ghosal","year":"2020","unstructured":"Ghosal A, Nandy A, Das AK, Goswami S, Panday M (2020) A short review on different clustering techniques and their applications. Emerg Technol Modell Graph. https:\/\/doi.org\/10.1007\/978-981-13-7403-6_9","journal-title":"Emerg Technol Modell Graph"},{"issue":"8","key":"1658_CR18","doi-asserted-by":"publisher","first-page":"68","DOI":"10.1109\/2.781637","volume":"32","author":"G Karypis","year":"1999","unstructured":"Karypis G, Han E-H, Kumar V (1999) Chameleon: hierarchical clustering using dynamic modeling. Computer 32(8):68\u201375","journal-title":"Computer"},{"issue":"3","key":"1658_CR19","doi-asserted-by":"publisher","first-page":"267","DOI":"10.1109\/TETC.2014.2330519","volume":"2","author":"A Fahad","year":"2014","unstructured":"Fahad A, Alshatri N, Tari Z, Alamri A, Khalil I, Zomaya AY, Foufou S, Bouras A (2014) A survey of clustering algorithms for big data: taxonomy and empirical analysis. IEEE Trans Emerg Top Comput 2(3):267\u2013279","journal-title":"IEEE Trans Emerg Top Comput"},{"issue":"3","key":"1658_CR20","doi-asserted-by":"publisher","first-page":"264","DOI":"10.1145\/331499.331504","volume":"31","author":"K Jain Anil","year":"1999","unstructured":"Jain Anil K, Narasimha Murty M, Flynn Patrick J (1999) Data clustering: a review. ACM Comput Surv 31(3):264\u2013323","journal-title":"ACM Comput Surv"},{"key":"1658_CR21","doi-asserted-by":"crossref","unstructured":"Cutting DR, Karger DR, Pedersen JO, Tukey JW (1992)Scatter\/gather: a cluster-based approach to browsing large document collections. In: Proceedings of the 15th annual international ACM SIGIR conference on Research and development in information retrieval. pp 318\u2013329. ACM","DOI":"10.1145\/133160.133214"},{"key":"1658_CR22","doi-asserted-by":"crossref","unstructured":"Xu W, Liu X, Gong Y (2003) Document clustering based on non-negative matrix factorization. In: Proceedings of the 26th annual international ACM SIGIR conference on research and development in informaion retrieval. pp 267\u2013273. ACM","DOI":"10.1145\/860435.860485"},{"issue":"6","key":"1658_CR23","doi-asserted-by":"publisher","first-page":"1336","DOI":"10.1109\/TKDE.2012.51","volume":"25","author":"Y-X Wang","year":"2013","unstructured":"Wang Y-X, Zhang Y-J (2013) Nonnegative matrix factorization: a comprehensive review. IEEE Trans Knowl Data Eng 25(6):1336\u20131353","journal-title":"IEEE Trans Knowl Data Eng"},{"issue":"1","key":"1658_CR24","doi-asserted-by":"publisher","first-page":"45","DOI":"10.1109\/TPAMI.2008.277","volume":"32","author":"CHQ Ding","year":"2008","unstructured":"Ding CHQ, Li T, Jordan MI (2008) Convex and semi-nonnegative matrix factorizations. IEEE Trans Pattern Anal Mach Intell 32(1):45\u201355","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"3","key":"1658_CR25","doi-asserted-by":"publisher","first-page":"417","DOI":"10.1109\/TPAMI.2016.2554555","volume":"39","author":"G Trigeorgis","year":"2017","unstructured":"Trigeorgis G, Bousmalis K, Zafeiriou S, Schuller BW (2017) A deep matrix factorization method for learning attribute representations. IEEE Trans Pattern Anal Mach Intell 39(3):417\u2013429","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"9","key":"1658_CR26","doi-asserted-by":"publisher","first-page":"2138","DOI":"10.1109\/TKDE.2013.65","volume":"26","author":"Z Li","year":"2014","unstructured":"Li Z, Liu J, Yang Y, Zhou X, Lu H (2014) Clustering-guided sparse structural learning for unsupervised feature selection. IEEE Trans Knowl Data Eng 26(9):2138\u20132150","journal-title":"IEEE Trans Knowl Data Eng"},{"issue":"5","key":"1658_CR27","doi-asserted-by":"publisher","first-page":"1083","DOI":"10.1109\/TCYB.2014.2344015","volume":"45","author":"Y Yang","year":"2015","unstructured":"Yang Y, Ma Z, Yang Y, Nie F, Heng TS (2015) Multitask spectral clustering by exploring intertask correlation. IEEE Trans Cybern 45(5):1083\u20131094","journal-title":"IEEE Trans Cybern"},{"issue":"12","key":"1658_CR28","doi-asserted-by":"publisher","first-page":"1624","DOI":"10.1109\/TKDE.2005.198","volume":"17","author":"D Cai","year":"2005","unstructured":"Cai D, He X, Han J (2005) Document clustering using locality preserving indexing. IEEE Trans Knowl Data Eng 17(12):1624\u20131637","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"1658_CR29","first-page":"1735","volume":"2","author":"R Hadsell","year":"2006","unstructured":"Hadsell R, Chopra S, LeCun Y (2006) Dimensionality reduction by learning an invariant mapping. Proc Conf Comput Visi Pattern Recognit 2:1735\u20131742","journal-title":"Proc Conf Comput Visi Pattern Recognit"},{"key":"1658_CR30","volume-title":"Introduction to modern information retrieval","author":"G Salton","year":"1983","unstructured":"Salton G, McGill MJ (1983) Introduction to modern information retrieval. McGraw Hill, New York"},{"key":"1658_CR31","doi-asserted-by":"crossref","unstructured":"Sam HE-H, Karypis G (2000) Centroid-based document classification: analysis and experimental results. In: European conference on principles of data mining and knowledge discovery. pp 424\u2013431. Springer","DOI":"10.1007\/3-540-45372-5_46"},{"key":"1658_CR32","first-page":"2837","volume":"11","author":"NX Vinh","year":"2010","unstructured":"Vinh NX, Epps J, Bailey J (2010) Information theoretic measures for clusterings comparison: variants, properties, normalization and correction for chance. J Mach Learn Res 11:2837\u20132854","journal-title":"J Mach Learn Res"},{"key":"1658_CR33","unstructured":"Rosenberg A, Hirschberg J (2007) V-measure: a conditional entropy-based external cluster evaluation measure. In: Proceedings of joint conference on empirical methods in natural language processing and computational natural language learning (EMNLP-CoNLL)"},{"key":"1658_CR34","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa F, Varoquaux G, Gramfort A, Michel V, Thirion B, Grisel O, Blondel M, Prettenhofer P, Weiss R, Dubourg V et al (2011) Scikit-learn: machine learning in python. J Mach Learn Res 12:2825\u20132830","journal-title":"J Mach Learn Res"},{"issue":"4","key":"1658_CR35","doi-asserted-by":"publisher","first-page":"688","DOI":"10.1093\/beheco\/ark016","volume":"17","author":"D Ruxton Graeme","year":"2006","unstructured":"Ruxton Graeme D (2006) The unequal variance t-test is an underused alternative to student\u2019s t-test and the mann-whitney u test. Behav Ecol 17(4):688\u2013690","journal-title":"Behav Ecol"},{"key":"1658_CR36","unstructured":"Friedman JH et\u00a0al (1994) Flexible metric nearest neighbor classification. Technical report, Technical report, Department of Statistics, Stanford University"},{"issue":"3","key":"1658_CR37","doi-asserted-by":"publisher","first-page":"1061","DOI":"10.1016\/j.patcog.2011.08.012","volume":"45","author":"R De Amorim","year":"2012","unstructured":"De Amorim R, Cordeiro R, Boris M (2012) Minkowski metric, feature weighting and anomalous cluster initializing in k-means clustering. Pattern Recogn 45(3):1061\u20131075","journal-title":"Pattern Recogn"}],"container-title":["Knowledge and Information Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10115-022-01658-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10115-022-01658-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10115-022-01658-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,3,7]],"date-time":"2022-03-07T04:19:00Z","timestamp":1646626740000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10115-022-01658-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,2,17]]},"references-count":37,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2022,3]]}},"alternative-id":["1658"],"URL":"https:\/\/doi.org\/10.1007\/s10115-022-01658-9","relation":{},"ISSN":["0219-1377","0219-3116"],"issn-type":[{"type":"print","value":"0219-1377"},{"type":"electronic","value":"0219-3116"}],"subject":[],"published":{"date-parts":[[2022,2,17]]},"assertion":[{"value":"29 September 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 January 2022","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"21 January 2022","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 February 2022","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}