{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,21]],"date-time":"2026-02-21T00:46:26Z","timestamp":1771634786758,"version":"3.50.1"},"reference-count":50,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"11","license":[{"start":{"date-parts":[[2024,11,1]],"date-time":"2024-11-01T00:00:00Z","timestamp":1730419200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0\/"}],"funder":[{"name":"Huawei Technologies Canada Company, Ltd."},{"name":"Mitacs Accelerate Program"},{"DOI":"10.13039\/501100001602","name":"Science Foundation Ireland","doi-asserted-by":"publisher","award":["13\/RC\/2094-2"],"award-info":[{"award-number":["13\/RC\/2094-2"]}],"id":[{"id":"10.13039\/501100001602","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100000038","name":"Natural Sciences and Engineering Research Council of Canada","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100000038","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100021202","name":"Alliance de recherche num\u00e9rique du Canada","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100021202","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IIEEE Trans. Software Eng."],"published-print":{"date-parts":[[2024,11]]},"DOI":"10.1109\/tse.2024.3469582","type":"journal-article","created":{"date-parts":[[2024,9,30]],"date-time":"2024-09-30T17:27:03Z","timestamp":1727717223000},"page":"3053-3070","source":"Crossref","is-referenced-by-count":6,"title":["LTM: Scalable and Black-Box Similarity-Based Test Suite Minimization Based on Language Models"],"prefix":"10.1109","volume":"50","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9096-6241","authenticated-orcid":false,"given":"Rongqi","family":"Pan","sequence":"first","affiliation":[{"name":"School of EECS, University of Ottawa, Ottawa, ON, Canada"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9336-7298","authenticated-orcid":false,"given":"Taher A.","family":"Ghaleb","sequence":"additional","affiliation":[{"name":"Computer Science Department, Trent University, Peterborough, ON, Canada"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1393-1010","authenticated-orcid":false,"given":"Lionel C.","family":"Briand","sequence":"additional","affiliation":[{"name":"Lero SFI Centre for Software Research, University of Limerick, Limerick, Ireland"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2018.2809600"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1145\/2430536.2430540"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1002\/stv.430"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1007\/s10664-021-10066-6"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1016\/j.infsof.2019.06.009"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICSE.2019.00055"},{"key":"ref7","doi-asserted-by":"crossref","first-page":"38","DOI":"10.1145\/3194718.3194731","article-title":"Testing and continuous integration at scale: Limits, costs, and expectations","volume-title":"Proc. 11th Int. Workshop Search-Based Softw. Testing","author":"Herzig","year":"2018"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICSE48619.2023.00146"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-35510-4_4"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.findings-emnlp.139"},{"key":"ref11","article-title":"GraphCodeBERT: Pre-training code representations with data flow","author":"Guo","year":"2020"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.acl-long.499"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1108\/ws.2000.07949fab.004"},{"key":"ref14","article-title":"Code Llama: Open foundation models for code","author":"Rozi\u00e8","year":"2023"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-16573-3_6"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1145\/3644388"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1016\/j.jss.2016.06.058"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/SANER.2018.8330200"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/iThings\/CPSCom.2011.135"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1016\/j.jss.2019.03.011"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2022.3170272"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1310.4546"},{"key":"ref23","article-title":"BERT: Pre-training of deep bidirectional transformers for language understanding","author":"Devlin","year":"2018"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1410"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/d18-2029"},{"key":"ref26","first-page":"143","article-title":"A probabilistic analysis of the Rocchio algorithm with TFIDF for text categorization","volume-title":"Proc. Int. Conf. Mach. Learning","volume":"97","author":"Joachims","year":"1997"},{"key":"ref27","first-page":"957","article-title":"From word embeddings to document distances","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Kusner","year":"2015"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICSE.2019.00054"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/4235.996017"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1145\/3540250.3549089"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1613\/jair.2934"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1090\/conm\/026\/737400"},{"issue":"2","key":"ref33","first-page":"19","article-title":"A survey on similarity measures in text mining","volume":"3","author":"Vijaymeena","year":"2016","journal-title":"Mach. Learn. Appl. Int. J."},{"key":"ref34","article-title":"CodeXGLUE: A machine learning benchmark dataset for code understanding and generation","author":"Lu","year":"2021"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/p16-1162"},{"key":"ref36","article-title":"CodeSearchNet challenge: Evaluating the state of semantic code search","author":"Husain","year":"2019"},{"key":"ref37","article-title":"The stack: 3 TB of permissively licensed source code","author":"Kocetkov","year":"2022"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref39","article-title":"ELECTRA: Pre-training text encoders as discriminators rather than generators","author":"Clark","year":"2020"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.emnlp-main.552"},{"key":"ref41","article-title":"Universal text representation from BERT: An empirical study","author":"Ma","year":"2019"},{"issue":"13","key":"ref42","first-page":"13","article-title":"A survey of text similarity approaches","volume":"68","author":"Gomaa","year":"2013","journal-title":"Int. J. Comput. Appl."},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-00234-2_1"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.2990567"},{"key":"ref45","article-title":"LTM: Scalable and black-box similarity-based test suite minimization based on language models (replication package)","author":"Pan","year":"2023"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1111\/j.1558-5646.1995.tb04456.x"},{"issue":"24","key":"ref47","first-page":"5614","article-title":"Effectiveness of the euclidean distance in high dimensional spaces","volume-title":"Optik","volume":"126","author":"Xia","year":"2015"},{"key":"ref48","article-title":"Large language models for software engineering:","volume-title":"Survey and open problems","author":"Fan","year":"2023"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/TPWRD.2019.2962275"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/TSE.2022.3201209"}],"container-title":["IEEE Transactions on Software Engineering"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/32\/10752626\/10697930.pdf?arnumber=10697930","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,27]],"date-time":"2024-11-27T00:36:52Z","timestamp":1732667812000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10697930\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11]]},"references-count":50,"journal-issue":{"issue":"11"},"URL":"https:\/\/doi.org\/10.1109\/tse.2024.3469582","relation":{},"ISSN":["0098-5589","1939-3520","2326-3881"],"issn-type":[{"value":"0098-5589","type":"print"},{"value":"1939-3520","type":"electronic"},{"value":"2326-3881","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,11]]}}}