{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T00:05:51Z","timestamp":1740096351808,"version":"3.37.3"},"publisher-location":"Berlin, Heidelberg","reference-count":48,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642452598"},{"type":"electronic","value":"9783642452604"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2013]]},"DOI":"10.1007\/978-3-642-45260-4_9","type":"book-chapter","created":{"date-parts":[[2013,11,18]],"date-time":"2013-11-18T09:56:14Z","timestamp":1384768574000},"page":"117-134","source":"Crossref","is-referenced-by-count":3,"title":["Using Machine Learning and Information Retrieval Techniques to Improve Software Maintainability"],"prefix":"10.1007","author":[{"given":"Anna","family":"Corazza","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sergio","family":"Di Martino","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Valerio","family":"Maggio","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Alessandro","family":"Moschitti","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Andrea","family":"Passerini","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Giuseppe","family":"Scanniello","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Fabrizio","family":"Silvestri","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"key":"9_CR1","first-page":"235","volume-title":"Proceedings of the 6th Working Conference on Reverse Engineering","author":"N. Anquetil","year":"1999","unstructured":"Anquetil, N., Fourrier, C., Lethbridge, T.C.: Experiments with clustering as a software remodularization method. In: Proceedings of the 6th Working Conference on Reverse Engineering, pp. 235\u2013255. IEEE Computer Society, Washington, DC (1999)"},{"unstructured":"Baker, B.: On finding duplication and near-duplication in large software systems. In: IEEE Proceedings of the Working Conference on Reverse Engineering (1995)","key":"9_CR2"},{"unstructured":"Baxter, I.D., Yahin, A., Moura, L., Sant\u2019Anna, M., Bier, L.: Clone detection using abstract syntax trees. In: Proceedings of the International Conference on Software Maintenance, pp. 368\u2013377. IEEE Press (1998)","key":"9_CR3"},{"doi-asserted-by":"crossref","unstructured":"Bellon, S., Koschke, R., Antoniol, G., Krinke, J., Merlo, E.M.: Comparison and evaluation of clone detection tools. IEEE Trans. Software Eng., 577\u2013591 (September 2007)","key":"9_CR4","DOI":"10.1109\/TSE.2007.70725"},{"key":"9_CR5","first-page":"251","volume-title":"Proceedings of the European Conference on Software Maintenance and Reengineering","author":"R.A. Bittencourt","year":"2009","unstructured":"Bittencourt, R.A., Guerrero, D.D.S.: Comparison of graph clustering algorithms for recovering software architecture module views. In: Proceedings of the European Conference on Software Maintenance and Reengineering, pp. 251\u2013254. IEEE Computer Society, Washington, DC (2009), http:\/\/portal.acm.org\/citation.cfm?id=1545011.1545446"},{"doi-asserted-by":"crossref","unstructured":"Bulychev, P., Minea, M.: Duplicate code detection using anti-unification. In: Spring\/Summer Young Researcher\u2019s Colloquium (2008)","key":"9_CR6","DOI":"10.15514\/SYRCOSE-2008-2-22"},{"key":"9_CR7","doi-asserted-by":"publisher","first-page":"35","DOI":"10.1109\/CSMR.2011.8","volume-title":"Proceedings of the 15th European Conference on Software Maintenance and Reengineering, CSMR 2011","author":"A. Corazza","year":"2011","unstructured":"Corazza, A., Di Martino, S., Maggio, V., Scanniello, G.: Investigating the use of lexical information for software system clustering. In: Proceedings of the 15th European Conference on Software Maintenance and Reengineering, CSMR 2011, pp. 35\u201344. IEEE Computer Society, Washington, DC (2011), http:\/\/dx.doi.org\/10.1109\/CSMR.2011.8"},{"doi-asserted-by":"crossref","unstructured":"Corazza, A., Di Martino, S., Scanniello, G.: A probabilistic based approach towards software system clustering. In: Proceedings of the European Conference on Software Maintenance and Reengineering, pp. 88\u201396 (2010)","key":"9_CR8","DOI":"10.1109\/CSMR.2010.36"},{"key":"9_CR9","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/ICSM.2010.5609715","volume-title":"Proceedings of the 2010 IEEE International Conference on Software Maintenance, ICSM 2010","author":"A. Corazza","year":"2010","unstructured":"Corazza, A., Di Martino, S., Maggio, V., Scanniello, G.: A tree kernel based approach for clone detection. In: Proceedings of the 2010 IEEE International Conference on Software Maintenance, ICSM 2010, pp. 1\u20135. IEEE Computer Society, Washington, DC (2010), http:\/\/dx.doi.org\/10.1109\/ICSM.2010.5609715"},{"key":"9_CR10","series-title":"CCIS","doi-asserted-by":"publisher","first-page":"42","DOI":"10.1007\/978-3-642-28033-7_5","volume-title":"Eternal Systems","author":"A. Corazza","year":"2012","unstructured":"Corazza, A., Di Martino, S., Maggio, V., Scanniello, G.: Combining machine learning and information retrieval techniques for software clustering. In: Moschitti, A., Scandariato, R. (eds.) EternalS 2011. CCIS, vol.\u00a0255, pp. 42\u201360. Springer, Heidelberg (2012)"},{"issue":"6","key":"9_CR11","doi-asserted-by":"publisher","first-page":"391","DOI":"10.1002\/(SICI)1097-4571(199009)41:6<391::AID-ASI1>3.0.CO;2-9","volume":"41","author":"S.C. Deerwester","year":"1990","unstructured":"Deerwester, S.C., Dumais, S.T., Landauer, T.K., Furnas, G.W., Harshman, R.A.: Indexing by latent semantic analysis. Journal of the American Society of Information Science\u00a041(6), 391\u2013407 (1990), http:\/\/citeseerx.ist.psu.edu\/viewdoc\/summary?doi=10.1.1.49.7546","journal-title":"Journal of the American Society of Information Science"},{"key":"9_CR12","first-page":"73","volume-title":"Proceedings of the Software Technology and Engineering Practice","author":"D. Doval","year":"1999","unstructured":"Doval, D., Mancoridis, S., Mitchell, B.S.: Automatic clustering of software systems using a genetic algorithm. In: Proceedings of the Software Technology and Engineering Practice, pp. 73\u201382. IEEE Computer Society, Washington, DC (1999), http:\/\/portal.acm.org\/citation.cfm?id=829540.832036"},{"issue":"4","key":"9_CR13","doi-asserted-by":"publisher","first-page":"573","DOI":"10.1109\/TSE.2009.19","volume":"35","author":"S. Ducasse","year":"2009","unstructured":"Ducasse, S., Pollet, D.: Software architecture reconstruction: A process-oriented taxonomy. IEEE Transactions on Software Engineering\u00a035(4), 573\u2013591 (2009)","journal-title":"IEEE Transactions on Software Engineering"},{"doi-asserted-by":"crossref","unstructured":"Ducasse, S., Rieger, M., Demeyer, S.: A language independent approach for detecting duplicated code. In: Proceedings of the International Conference on Software Maintenance, pp. 109\u2013118 (1999)","key":"9_CR14","DOI":"10.1109\/ICSM.1999.792593"},{"key":"9_CR15","first-page":"217","volume-title":"Proceedings of the 22nd International Conference on Machine Learning, ICML 2005","author":"T. Finley","year":"2005","unstructured":"Finley, T., Joachims, T.: Supervised clustering with support vector machines. In: Proceedings of the 22nd International Conference on Machine Learning, ICML 2005, pp. 217\u2013224. ACM, New York (2005), http:\/\/doi.acm.org\/10.1145\/1102351.1102379"},{"key":"9_CR16","series-title":"Lecture Notes in Artificial Intelligence","doi-asserted-by":"publisher","first-page":"56","DOI":"10.1007\/978-3-540-78652-8_3","volume-title":"Probabilistic Inductive Logic Programming","author":"P. Frasconi","year":"2008","unstructured":"Frasconi, P., Passerini, A.: Learning with kernels and logical representations. In: De Raedt, L., Frasconi, P., Kersting, K., Muggleton, S. (eds.) Probabilistic Inductive Logic Programming. LNCS (LNAI), vol.\u00a04911, pp. 56\u201391. Springer, Heidelberg (2008)"},{"key":"9_CR17","first-page":"321","volume-title":"Proceedings of the 30th International Conference on Software Engineering, ICSE 2008","author":"M. Gabel","year":"2008","unstructured":"Gabel, M., Jiang, L., Su, Z.: Scalable detection of semantic clones. In: Proceedings of the 30th International Conference on Software Engineering, ICSE 2008, pp. 321\u2013330. ACM, New York (2008), http:\/\/doi.acm.org\/10.1145\/1368088.1368132"},{"key":"9_CR18","doi-asserted-by":"crossref","first-page":"91","DOI":"10.1145\/336512.336537","volume-title":"Proceedings of the Conference on the Future of Software Engineering, ICSE 2000","author":"D. Garlan","year":"2000","unstructured":"Garlan, D.: Software architecture: a roadmap. In: Proceedings of the Conference on the Future of Software Engineering, ICSE 2000, pp. 91\u2013101. ACM, New York (2000), http:\/\/doi.acm.org\/10.1145\/336512.336537"},{"unstructured":"G\u00f6nen, M., Alpaydin, E.: Multiple kernel learning algorithms. J. Mach. Learn. Res., 2211\u20132268 (July 2011)","key":"9_CR19"},{"issue":"3","key":"9_CR20","doi-asserted-by":"publisher","first-page":"1171","DOI":"10.1214\/009053607000000677","volume":"36","author":"T. Hofmann","year":"2008","unstructured":"Hofmann, T., Sch\u00f6lkopf, B., Smola, A.J.: Kernel methods in machine learning. Annals of Statistics\u00a036(3), 1171\u20131220 (2008), http:\/\/www.projecteuclid.org\/DPubS?verb=Displayversion=1.0service=UIhandle=euclid.aos\/1211819561page=record","journal-title":"Annals of Statistics"},{"key":"9_CR21","first-page":"96","volume-title":"Proceedings of the 29th International Conference on Software Engineering, ICSE 2007","author":"L. Jiang","year":"2007","unstructured":"Jiang, L., Misherghi, G., Su, Z., Glondu, S.: Deckard: Scalable and accurate tree-based detection of code clones. In: Proceedings of the 29th International Conference on Software Engineering, ICSE 2007, pp. 96\u2013105. IEEE Computer Society, Washington, DC (2007), http:\/\/dx.doi.org\/10.1109\/ICSE.2007.30"},{"unstructured":"Johnson, J.H.: Identifying redundancy in source code using fingerprints. In: Proc. Conf. Centre for Advanced Studies on Collaborative Research (CASCON), pp. 171\u2013183. IBM Press (1993)","key":"9_CR22"},{"issue":"7","key":"9_CR23","doi-asserted-by":"publisher","first-page":"654","DOI":"10.1109\/TSE.2002.1019480","volume":"28","author":"T. Kamiya","year":"2002","unstructured":"Kamiya, T., Kusumoto, S., Inoue, K.: Ccfinder: A multilinguistic token-based code clone detection system for large scale source code. IEEE Trans. Software Eng.\u00a028(7), 654\u2013670 (2002)","journal-title":"IEEE Trans. Software Eng."},{"key":"9_CR24","doi-asserted-by":"publisher","first-page":"604","DOI":"10.1145\/324133.324140","volume":"46","author":"J.M. Kleinberg","year":"1999","unstructured":"Kleinberg, J.M.: Authoritative sources in a hyperlinked environment. Journal of the ACM\u00a046, 604\u2013632 (1999), http:\/\/doi.acm.org\/10.1145\/324133.324140","journal-title":"Journal of the ACM"},{"key":"9_CR25","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"40","DOI":"10.1007\/3-540-47764-0_3","volume-title":"Static Analysis","author":"R. Komondoor","year":"2001","unstructured":"Komondoor, R., Horwitz, S.: Using slicing to identify duplication in source code. In: Cousot, P. (ed.) SAS 2001. LNCS, vol.\u00a02126, pp. 40\u201356. Springer, Heidelberg (2001)"},{"unstructured":"Koschke, R.: Atomic architectural component recovery for program understanding and evolution. Softwaretechnik-Trends (2000), http:\/\/www.iste.uni-stuttgart.de\/ps\/rainer\/thesis","key":"9_CR26"},{"key":"9_CR27","doi-asserted-by":"publisher","first-page":"253","DOI":"10.1109\/WCRE.2006.18","volume-title":"WCRE 2006: Proceedings of the 13th Working Conference on Reverse Engineering","author":"R. Koschke","year":"2006","unstructured":"Koschke, R., Falke, R., Frenzel, P.: Clone detection using abstract syntax suffix trees. In: WCRE 2006: Proceedings of the 13th Working Conference on Reverse Engineering, pp. 253\u2013262. IEEE Computer Society, Washington, DC (2006)"},{"unstructured":"Krinke, J.: Identifying Similar Code with Program Dependence Graphs. In: Proc. Working Conf. Reverse Engineering (WCRE), pp. 301\u2013309. IEEE Computer Society Press (2001)","key":"9_CR28"},{"key":"9_CR29","doi-asserted-by":"publisher","first-page":"230","DOI":"10.1016\/j.infsof.2006.10.017","volume":"49","author":"A. Kuhn","year":"2007","unstructured":"Kuhn, A., Ducasse, S., G\u00edrba, T.: Semantic clustering: Identifying topics in source code. Information and Software Technology\u00a049, 230\u2013243 (2007), http:\/\/portal.acm.org\/citation.cfm?id=1224560.1224698","journal-title":"Information and Software Technology"},{"issue":"3","key":"9_CR30","doi-asserted-by":"publisher","first-page":"305","DOI":"10.1007\/s10994-009-5163-1","volume":"78","author":"N. Landwehr","year":"2010","unstructured":"Landwehr, N., Passerini, A., Raedt, L., Frasconi, P.: Fast learning of relational kernels. Mach. Learn.\u00a078(3), 305\u2013342 (2010), http:\/\/dx.doi.org\/10.1007\/s10994-009-5163-1","journal-title":"Mach. Learn."},{"issue":"9","key":"9_CR31","doi-asserted-by":"publisher","first-page":"1060","DOI":"10.1109\/PROC.1980.11805","volume":"68","author":"M.M. Lehman","year":"1980","unstructured":"Lehman, M.M.: Programs, life cycles, and laws of software evolution. Proc. IEEE\u00a068(9), 1060\u20131076 (1980)","journal-title":"Proc. IEEE"},{"issue":"4","key":"9_CR32","doi-asserted-by":"publisher","first-page":"361","DOI":"10.1023\/B:SQJO.0000039793.31052.72","volume":"12","author":"A.M. Leit\u00e3o","year":"2004","unstructured":"Leit\u00e3o, A.M.: Detection of redundant code using r2d2. Software Quality Journal\u00a012(4), 361\u2013382 (2004)","journal-title":"Software Quality Journal"},{"key":"9_CR33","doi-asserted-by":"publisher","first-page":"103","DOI":"10.1109\/ICSE.2001.919085","volume-title":"Proceedings of the 23rd International Conference on Software Engineering, ICSE 2001","author":"J.I. Maletic","year":"2001","unstructured":"Maletic, J.I., Marcus, A.: Supporting program comprehension using semantic and structural information. In: Proceedings of the 23rd International Conference on Software Engineering, ICSE 2001, pp. 103\u2013112. IEEE Computer Society, Washington, DC (2001), http:\/\/portal.acm.org\/citation.cfm?id=381473.381484"},{"issue":"11","key":"9_CR34","doi-asserted-by":"publisher","first-page":"759","DOI":"10.1109\/TSE.2007.70732","volume":"33","author":"O. Maqbool","year":"2007","unstructured":"Maqbool, O., Babri, H.: Hierarchical clustering for software architecture recovery. IEEE Transactions on Software Engineering\u00a033(11), 759\u2013780 (2007)","journal-title":"IEEE Transactions on Software Engineering"},{"key":"9_CR35","first-page":"585","volume-title":"Proceedings of the 22nd International Conference on Machine Learning, ICML 2005","author":"S. Menchetti","year":"2005","unstructured":"Menchetti, S., Costa, F., Frasconi, P.: Weighted decomposition kernels. In: Proceedings of the 22nd International Conference on Machine Learning, ICML 2005, pp. 585\u2013592. ACM, New York (2005), http:\/\/doi.acm.org\/10.1145\/1102351.1102425"},{"key":"9_CR36","doi-asserted-by":"publisher","first-page":"193","DOI":"10.1109\/TSE.2006.31","volume":"32","author":"B.S. Mitchell","year":"2006","unstructured":"Mitchell, B.S., Mancoridis, S.: On the automatic modularization of software systems using the bunch tool. IEEE Transactions on Software Engineering\u00a032, 193\u2013208 (2006), http:\/\/portal.acm.org\/citation.cfm?id=1128600.1128815","journal-title":"IEEE Transactions on Software Engineering"},{"key":"9_CR37","first-page":"193","volume-title":"Computational Linguistics","author":"A. Moschitti","year":"2008","unstructured":"Moschitti, A., Basili, R., Pighin, D.: Tree Kernels for Semantic Role Labeling. In: Computational Linguistics, pp. 193\u2013224. MIT Press, Cambridge (2008)"},{"issue":"3","key":"9_CR38","doi-asserted-by":"publisher","first-page":"307","DOI":"10.1007\/s00165-011-0199-y","volume":"24","author":"M. Risi","year":"2012","unstructured":"Risi, M., Scanniello, G., Tortora, G.: Using fold-in and fold-out in the architecture recovery of software systems. Formal Asp. Comput.\u00a024(3), 307\u2013330 (2012)","journal-title":"Formal Asp. Comput."},{"doi-asserted-by":"crossref","unstructured":"Roy, C.K., Cordy, J.R.: Nicad: Accurate detection of near-miss intentional clones using flexible pretty-printing and code normalization. In: ICPC, pp. 172\u2013181 (2008)","key":"9_CR39","DOI":"10.1109\/ICPC.2008.41"},{"issue":"7","key":"9_CR40","doi-asserted-by":"publisher","first-page":"470","DOI":"10.1016\/j.scico.2009.02.007","volume":"74","author":"C.K. Roy","year":"2009","unstructured":"Roy, C.K., Cordy, J.R., Koschke, R.: Comparison and evaluation of code clone detection techniques and tools: A qualitative approach. Sci. Comput. Program.\u00a074(7), 470\u2013495 (2009)","journal-title":"Sci. Comput. Program."},{"key":"9_CR41","doi-asserted-by":"publisher","first-page":"897","DOI":"10.1002\/spe.988","volume":"40","author":"G. Scanniello","year":"2010","unstructured":"Scanniello, G., D\u2019Amico, A., D\u2019Amico, C., D\u2019Amico, T.: Architectural layer recovery for software system understanding and evolution. Software Practice and Experience\u00a040, 897\u2013916 (2010), http:\/\/dx.doi.org\/10.1002\/spe.v40:10","journal-title":"Software Practice and Experience"},{"key":"9_CR42","doi-asserted-by":"publisher","first-page":"180","DOI":"10.1109\/ICPC.2010.17","volume-title":"Proceedings of the IEEE 18th International Conference on Program Comprehension, ICPC 2010","author":"G. Scanniello","year":"2010","unstructured":"Scanniello, G., D\u2019Amico, A., D\u2019Amico, C., D\u2019Amico, T.: Using the kleinberg algorithm and vector space model for software system clustering. In: Proceedings of the IEEE 18th International Conference on Program Comprehension, ICPC 2010, pp. 180\u2013189. IEEE Computer Society, Washington, DC (2010), http:\/\/dx.doi.org\/10.1109\/ICPC.2010.17"},{"unstructured":"Tzerpos, V., Holt, R.C.: On the stability of software clustering algorithms. In: Proceedings of the 8th International Workshop on Program Comprehension, pp. 211\u2013218 (2000)","key":"9_CR43"},{"issue":"1","key":"9_CR44","doi-asserted-by":"crossref","first-page":"S276","DOI":"10.1093\/bioinformatics\/18.suppl_1.S276","volume":"18","author":"J.P. Vert","year":"2002","unstructured":"Vert, J.P.: A Tree Kernel to analyse phylogenetic profiles. Bioinformatics\u00a018(suppl. 1), S276\u2013S284 (2002)","journal-title":"Bioinformatics"},{"key":"9_CR45","doi-asserted-by":"publisher","first-page":"128","DOI":"10.1109\/SCAM.2004.6","volume-title":"SCAM 2004: Proceedings of the Fourth IEEE International Workshop on Source Code Analysis and Manipulation","author":"V. Wahler","year":"2004","unstructured":"Wahler, V., Seipel, D., von Gudenberg, J.W., Fischer, G.: Clone detection in source code by frequent itemset techniques. In: SCAM 2004: Proceedings of the Fourth IEEE International Workshop on Source Code Analysis and Manipulation, pp. 128\u2013135. IEEE Computer Society, Washington, DC (2004)"},{"key":"9_CR46","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1109\/WCRE.1997.624574","volume-title":"Proceedings of the Fourth Working Conference on Reverse Engineering (WCRE 1997)","author":"T.A. Wiggerts","year":"1997","unstructured":"Wiggerts, T.A.: Using clustering algorithms in legacy systems remodularization. In: Proceedings of the Fourth Working Conference on Reverse Engineering (WCRE 1997), pp. 33\u201343. IEEE Computer Society, Washington, DC (1997), http:\/\/portal.acm.org\/citation.cfm?id=832304.836999"},{"doi-asserted-by":"crossref","unstructured":"Wu, J., Hassan, A.E., Holt, R.C.: Comparison of clustering algotithms in the context of software evolution. In: Proceedings of the 21st IEEE International Conference on Software Maintenance, pp. 525\u2013535. IEEE Computer Society (2005)","key":"9_CR47","DOI":"10.1109\/ICSM.2005.31"},{"issue":"7","key":"9_CR48","doi-asserted-by":"publisher","first-page":"739","DOI":"10.1002\/spe.4380210706","volume":"21","author":"W. Yang","year":"1991","unstructured":"Yang, W.: Identifying syntactic differences between two programs. Software - Practice and Experience\u00a021(7), 739\u2013755 (1991)","journal-title":"Software - Practice and Experience"}],"container-title":["Communications in Computer and Information Science","Trustworthy Eternal Systems via Evolving Software, Data and Knowledge"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-45260-4_9","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,3,12]],"date-time":"2022-03-12T18:08:08Z","timestamp":1647108488000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-45260-4_9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013]]},"ISBN":["9783642452598","9783642452604"],"references-count":48,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-45260-4_9","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"type":"print","value":"1865-0929"},{"type":"electronic","value":"1865-0937"}],"subject":[],"published":{"date-parts":[[2013]]}}}