{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,5]],"date-time":"2026-01-05T21:03:43Z","timestamp":1767647023722,"version":"3.48.0"},"reference-count":44,"publisher":"Springer Science and Business Media LLC","issue":"10","license":[{"start":{"date-parts":[[2025,11,20]],"date-time":"2025-11-20T00:00:00Z","timestamp":1763596800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2025,11,20]],"date-time":"2025-11-20T00:00:00Z","timestamp":1763596800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J. King Saud Univ. Comput. Inf. Sci."],"published-print":{"date-parts":[[2025,12]]},"DOI":"10.1007\/s44443-025-00362-2","type":"journal-article","created":{"date-parts":[[2025,11,20]],"date-time":"2025-11-20T08:38:53Z","timestamp":1763627933000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Quantifying cross-language code reuse via function-level clone detection"],"prefix":"10.1007","volume":"37","author":[{"given":"Yi","family":"Rong","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yan","family":"Zhou","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,11,20]]},"reference":[{"key":"362_CR1","doi-asserted-by":"crossref","unstructured":"Abid S, Cai X, Jiang L (2023) Interpreting codebert for semantic code clone detection. In 2023 30th Asia-Pacific Software Engineering Conference (APSEC) (pp 229\u2013238). IEEE","DOI":"10.1109\/APSEC60848.2023.00033"},{"key":"362_CR2","doi-asserted-by":"crossref","unstructured":"Baker B\u00a0S (1995) On finding duplication and near-duplication in large software systems. In: Proceedings of 2nd working conference on reverse engineering (pp 86\u201395). IEEE","DOI":"10.1109\/WCRE.1995.514697"},{"key":"362_CR3","doi-asserted-by":"crossref","unstructured":"Bui N\u00a0D, Yu Y, Jiang L (2021) Infercode: Self-supervised learning of code representations by predicting subtrees. In: 2021 IEEE\/ACM 43rd International Conference on Software Engineering (ICSE) (pp 1186\u20131197). IEEE","DOI":"10.1109\/ICSE43902.2021.00109"},{"key":"362_CR4","doi-asserted-by":"publisher","first-page":"273","DOI":"10.1587\/transinf.2016EDP7334","volume":"100","author":"X Cheng","year":"2017","unstructured":"Cheng X, Peng Z, Jiang L, Zhong H, Yu H, Zhao J (2017) Clcminer: detecting cross-language clones without intermediates. IEICE Trans Inf Syst 100:273\u2013284","journal-title":"IEICE Trans Inf Syst"},{"key":"362_CR5","doi-asserted-by":"crossref","unstructured":"Chilowicz M, Duris E, Roussel G (2009) Syntax tree fingerprinting for source code similarity detection. In: 2009 IEEE 17th international conference on program comprehension (pp 243\u2013247). IEEE","DOI":"10.1109\/ICPC.2009.5090050"},{"key":"362_CR6","doi-asserted-by":"crossref","unstructured":"Cordy J\u00a0R, Roy C\u00a0K (2011) The nicad clone detector. In: 2011 IEEE 19th international conference on program comprehension (pp 219\u2013220). IEEE","DOI":"10.1109\/ICPC.2011.26"},{"key":"362_CR7","doi-asserted-by":"publisher","first-page":"12084","DOI":"10.3390\/app132112084","volume":"13","author":"Y Fang","year":"2023","unstructured":"Fang Y, Zhou F, Xu Y, Liu Z (2023) Tcccd: Triplet-based cross-language code clone detection. Appl Sci 13:12084","journal-title":"Appl Sci"},{"key":"362_CR8","doi-asserted-by":"crossref","unstructured":"Feng Z, Guo D, Tang D, Duan N, Feng X, Gong M, Shou L, Qin B, Liu T, Jiang D, et\u00a0al (2020) Codebert: A pre-trained model for programming and natural languages. arXiv:2002.08155,","DOI":"10.18653\/v1\/2020.findings-emnlp.139"},{"key":"362_CR9","unstructured":"Guo D, Ren S, Lu S, Feng Z, Tang D, Liu S, Zhou L, Duan N, Svyatkovskiy A, Fu S, et\u00a0al (2020) Graphcodebert: Pre-training code representations with data flow. arXiv:2009.08366,"},{"key":"362_CR10","doi-asserted-by":"crossref","unstructured":"Jiang L, Misherghi G, Su Z, Glondu S (2007) Deckard: Scalable and accurate tree-based detection of code clones. In: 29th International Conference on Software Engineering (ICSE\u201907) (pp 96\u2013105). IEEE","DOI":"10.1109\/ICSE.2007.30"},{"key":"362_CR11","doi-asserted-by":"crossref","unstructured":"Juergens E, Deissenboeck F, Hummel B, Wagner S (2009) Do code clones matter? In: 2009 IEEE 31st International Conference on Software Engineering (pp 485\u2013495). IEEE","DOI":"10.1109\/ICSE.2009.5070547"},{"key":"362_CR12","doi-asserted-by":"publisher","first-page":"654","DOI":"10.1109\/TSE.2002.1019480","volume":"28","author":"T Kamiya","year":"2002","unstructured":"Kamiya T, Kusumoto S, Inoue K (2002) Ccfinder: A multilinguistic token-based code clone detection system for large scale source code. IEEE Trans Software Eng 28:654\u2013670","journal-title":"IEEE Trans Software Eng"},{"key":"362_CR13","doi-asserted-by":"crossref","unstructured":"Keivanloo I, Rilling J, Charland P (2011) Internet-scale real-time code clone search via multi-level indexing. In: 2011 18th Working Conference on Reverse Engineering (pp 23\u201327). IEEE","DOI":"10.1109\/WCRE.2011.13"},{"key":"362_CR14","doi-asserted-by":"crossref","unstructured":"Kochhar P\u00a0S, Wijedasa D, Lo D (2016) A large scale study of multiple programming languages and code quality. In: 2016 IEEE 23Rd international conference on software analysis, evolution, and reengineering (SANER) (pp 563\u2013573). IEEE volume\u00a01","DOI":"10.1109\/SANER.2016.112"},{"key":"362_CR15","unstructured":"Koschke R (2007) Survey of research on software clones,"},{"key":"362_CR16","doi-asserted-by":"crossref","unstructured":"Krinke J (2007) A study of consistent and inconsistent changes to code clones. In: 14th working conference on reverse engineering (WCRE 2007) (pp 170\u2013178). IEEE","DOI":"10.1109\/WCRE.2007.7"},{"key":"362_CR17","doi-asserted-by":"crossref","unstructured":"Lei M, Li H, Li J, Aundhkar N, Kim D-K (2022) Deep learning application on code clone detection: A review of current knowledge. J Syst Softw 184:111141","DOI":"10.1016\/j.jss.2021.111141"},{"key":"362_CR18","doi-asserted-by":"crossref","unstructured":"Li L, Feng H, Zhuang W, Meng N, Ryder B (2017) Cclearner: A deep learning-based clone detection approach. In: 2017 IEEE international conference on software maintenance and evolution (ICSME) (pp 249\u2013260). IEEE","DOI":"10.1109\/ICSME.2017.46"},{"key":"362_CR19","doi-asserted-by":"publisher","first-page":"5027198","DOI":"10.1155\/2020\/5027198","volume":"2020","author":"Y Meng","year":"2020","unstructured":"Meng Y, Liu L (2020) [retracted] a deep learning approach for a source code detection model using self-attention. Complexity 2020:5027198","journal-title":"Complexity"},{"key":"362_CR20","doi-asserted-by":"crossref","unstructured":"Mou L, Li G, Zhang L, Wang T, Jin Z (2016) Convolutional neural networks over tree structures for programming language processing. In: Proceedings of the AAAI conference on artificial intelligence. volume\u00a030","DOI":"10.1609\/aaai.v30i1.10139"},{"key":"362_CR21","doi-asserted-by":"crossref","unstructured":"Moumoula M\u00a0B, Kabor\u00e9 A\u00a0K, Klein J, Bissyand\u00e9 T\u00a0F (2024) Large language models for cross-language code clone detection. CoRR,","DOI":"10.1145\/3715764"},{"key":"362_CR22","doi-asserted-by":"crossref","unstructured":"Nafi K\u00a0W, Kar T\u00a0S, Roy B, Roy C\u00a0K, Schneider K\u00a0A (2019) Clcdsa: cross language code clone detection using syntactical features and api documentation. In: 2019 34th IEEE\/ACM International Conference on Automated Software Engineering (ASE) (pp 1026\u20131037). IEEE","DOI":"10.1109\/ASE.2019.00099"},{"key":"362_CR23","doi-asserted-by":"crossref","unstructured":"Perez D, Chiba S (2019) Cross-language clone detection by learning over abstract syntax trees. In: 2019 IEEE\/ACM 16th International Conference on Mining Software Repositories (MSR) (pp 518\u2013528). IEEE","DOI":"10.1109\/MSR.2019.00078"},{"key":"362_CR24","doi-asserted-by":"crossref","unstructured":"Pham N\u00a0H, Nguyen H\u00a0A, Nguyen T\u00a0T, Al-Kofahi J\u00a0M, Nguyen T\u00a0N (2009) Complete and accurate clone detection in graph-based models. In: 2009 IEEE 31st International Conference on Software Engineering (pp 276\u2013286). IEEE","DOI":"10.1109\/ICSE.2009.5070528"},{"key":"362_CR25","first-page":"1016","volume":"8","author":"L Prechelt","year":"2002","unstructured":"Prechelt L, Malpohl G, Philippsen M et al (2002) Finding plagiarisms among a set of programs with jplag. J Univers Comput Sci 8:1016","journal-title":"J Univers Comput Sci"},{"key":"362_CR26","unstructured":"Rabin M\u00a0O (1981) Fingerprinting by random polynomials. Ph.D. thesis Cambridge, MA, USA"},{"key":"362_CR27","doi-asserted-by":"publisher","first-page":"1165","DOI":"10.1016\/j.infsof.2013.01.008","volume":"55","author":"D Rattan","year":"2013","unstructured":"Rattan D, Bhatia R, Singh M (2013) Software clone detection: A systematic review. Inf Softw Technol 55:1165\u20131199","journal-title":"Inf Softw Technol"},{"key":"362_CR28","first-page":"64","volume":"541","author":"CK Roy","year":"2007","unstructured":"Roy CK, Cordy JR (2007) A survey on software clone detection research. Queen\u2019s School Comput TR 541:64\u201368","journal-title":"Queen\u2019s School Comput TR"},{"key":"362_CR29","doi-asserted-by":"crossref","unstructured":"Roy C\u00a0K, Cordy J\u00a0R (2008) Nicad: Accurate detection of near-miss intentional clones using flexible pretty-printing and code normalization. In: 2008 16th iEEE international conference on program comprehension (pp 172\u2013181). IEEE","DOI":"10.1109\/ICPC.2008.41"},{"key":"362_CR30","doi-asserted-by":"crossref","unstructured":"Saini V, Farmahinifarahani F, Lu Y, Baldi P, Lopes C\u00a0V (2018) Oreo: Detection of clones in the twilight zone. In: Proceedings of the 2018 26th ACM joint meeting on European software engineering conference and symposium on the foundations of software engineering (pp 354\u2013365)","DOI":"10.1145\/3236024.3236026"},{"key":"362_CR31","doi-asserted-by":"crossref","unstructured":"Sajnani H, Saini V, Svajlenko J, Roy C\u00a0K, Lopes C\u00a0V (2016) Sourcerercc: Scaling code clone detection to big-code. In: Proceedings of the 38th international conference on software engineering (pp 1157\u20131168)","DOI":"10.1145\/2884781.2884877"},{"key":"362_CR32","doi-asserted-by":"crossref","unstructured":"Svajlenko J, Roy C\u00a0K (2015) Evaluating clone detection tools with bigclonebench. In: 2015 IEEE international conference on software maintenance and evolution (ICSME) (pp 131\u2013140). IEEE","DOI":"10.1109\/ICSM.2015.7332459"},{"key":"362_CR33","doi-asserted-by":"crossref","unstructured":"Svyatkovskiy A, Deng S\u00a0K, Fu S, Sundaresan N (2020) Intellicode compose: Code generation using transformer. In: Proceedings of the 28th ACM joint meeting on European software engineering conference and symposium on the foundations of software engineering (pp 1433\u20131443)","DOI":"10.1145\/3368089.3417058"},{"key":"362_CR34","doi-asserted-by":"crossref","unstructured":"Tao C, Zhan Q, Hu X, Xia X (2022) C4: Contrastive cross-language code clone detection. In: Proceedings of the 30th IEEE\/ACM international conference on program comprehension (pp 413\u2013424)","DOI":"10.1145\/3524610.3527911"},{"key":"362_CR35","doi-asserted-by":"crossref","unstructured":"Vislavski T, Raki\u0107 G, Cardozo N, Budimac Z (2018) Licca: A tool for cross-language clone detection. In: 2018 IEEE 25th international conference on software analysis, evolution and reengineering (SANER) (pp 512\u2013516). IEEE","DOI":"10.1109\/SANER.2018.8330250"},{"key":"362_CR36","doi-asserted-by":"crossref","unstructured":"Wan Z, Xie C, Zeng Y, Hu Y (2025) Code clone detection based on semantic images. Available at SSRN 5333788,","DOI":"10.2139\/ssrn.5333788"},{"key":"362_CR37","doi-asserted-by":"crossref","unstructured":"Wang W, Li G, Ma B, Xia X, Jin Z (2020) Detecting code clones with graph neural network and flow-augmented abstract syntax tree. In: 2020 IEEE 27th International Conference on Software Analysis, Evolution and Reengineering (SANER) (pp 261\u2013271). IEEE","DOI":"10.1109\/SANER48275.2020.9054857"},{"key":"362_CR38","doi-asserted-by":"crossref","unstructured":"Wang Y, Wang W, Joty S, Hoi S\u00a0C (2021) Codet5: Identifier-aware unified pre-trained encoder-decoder models for code understanding and generation. arXiv:2109.00859,","DOI":"10.18653\/v1\/2021.emnlp-main.685"},{"key":"362_CR39","doi-asserted-by":"crossref","unstructured":"Wei H, Li M (2017) Supervised deep features for software functional clone detection by exploiting lexical and syntactical information in source code. In: IJCAI (pp 3034\u20133040)","DOI":"10.24963\/ijcai.2017\/423"},{"key":"362_CR40","doi-asserted-by":"crossref","unstructured":"White M, Tufano M, Vendome C, Poshyvanyk D (2016) Deep learning code fragments for code clone detection. In: Proceedings of the 31st IEEE\/ACM international conference on automated software engineering (pp 87\u201398)","DOI":"10.1145\/2970276.2970326"},{"key":"362_CR41","doi-asserted-by":"crossref","unstructured":"Zhang J, Wang X, Zhang H, Sun H, Wang K, Liu X (2019) A novel neural source code representation based on abstract syntax tree. In: 2019 IEEE\/ACM 41st International Conference on Software Engineering (ICSE) (pp 783\u2013794). IEEE","DOI":"10.1109\/ICSE.2019.00086"},{"key":"362_CR42","doi-asserted-by":"crossref","unstructured":"Zhang Z, Saber T (2025) Ast-enhanced or ast-overloaded? the surprising impact of hybrid graph representations on code clone detection. arXiv:2506.14470,","DOI":"10.1109\/ICSME64153.2025.00033"},{"key":"362_CR43","doi-asserted-by":"crossref","unstructured":"Zhao G, Huang J (2018) Deepsim: deep learning code functional similarity. In: Proceedings of the 2018 26th ACM joint meeting on european software engineering conference and symposium on the foundations of software engineering (pp 141\u2013151)","DOI":"10.1145\/3236024.3236068"},{"key":"362_CR44","unstructured":"Zhu M, Jain A, Suresh K, Ravindran R, Tipirneni S, Reddy C\u00a0K (2022) Xlcost: A benchmark dataset for cross-lingual code intelligence. arXiv:2206.08474,"}],"container-title":["Journal of King Saud University Computer and Information Sciences"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s44443-025-00362-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s44443-025-00362-2","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s44443-025-00362-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,5]],"date-time":"2026-01-05T18:48:33Z","timestamp":1767638913000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s44443-025-00362-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,11,20]]},"references-count":44,"journal-issue":{"issue":"10","published-print":{"date-parts":[[2025,12]]}},"alternative-id":["362"],"URL":"https:\/\/doi.org\/10.1007\/s44443-025-00362-2","relation":{},"ISSN":["1319-1578","2213-1248"],"issn-type":[{"type":"print","value":"1319-1578"},{"type":"electronic","value":"2213-1248"}],"subject":[],"published":{"date-parts":[[2025,11,20]]},"assertion":[{"value":"12 September 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"24 October 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 November 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing Interests"}}],"article-number":"327"}}