{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,23]],"date-time":"2026-06-23T19:30:30Z","timestamp":1782243030236,"version":"3.54.5"},"reference-count":98,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2025,3,6]],"date-time":"2025-03-06T00:00:00Z","timestamp":1741219200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,3,6]],"date-time":"2025-03-06T00:00:00Z","timestamp":1741219200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Empir Software Eng"],"published-print":{"date-parts":[[2025,5]]},"DOI":"10.1007\/s10664-025-10631-3","type":"journal-article","created":{"date-parts":[[2025,3,6]],"date-time":"2025-03-06T03:36:33Z","timestamp":1741232193000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["Towards semantic versioning of open pre-trained language model releases on hugging face"],"prefix":"10.1007","volume":"30","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9212-4566","authenticated-orcid":false,"given":"Adekunle","family":"Ajibode","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Abdul Ali","family":"Bangash","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Filipe R.","family":"Cogo","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Bram","family":"Adams","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Ahmed E.","family":"Hassan","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2025,3,6]]},"reference":[{"key":"10631_CR1","doi-asserted-by":"publisher","first-page":"1107","DOI":"10.1007\/s10664-015-9377-5","volume":"21","author":"SL Abebe","year":"2016","unstructured":"Abebe SL, Ali N, Hassan AE (2016) An empirical study of software release notes. Empir Soft Eng 21:1107\u20131142","journal-title":"Empir Soft Eng"},{"key":"10631_CR2","doi-asserted-by":"crossref","unstructured":"Ahn D, Almaatouq A, Gulabani M, Hosanagar K (2024) Impact of model interpretability and outcome feedback on trust in ai. In Proceedings of the CHI conference on human factors in computing systems, pp 1\u201325","DOI":"10.1145\/3613904.3642780"},{"key":"10631_CR3","unstructured":"Ajibode A (2024) Wip-24: Towards semantic versioning of pre-trained language models. https:\/\/github.com\/SAILResearch\/wip-24-adekunle-lm-release"},{"issue":"3","key":"10631_CR4","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1016\/j.tjem.2018.08.001","volume":"18","author":"H Akoglu","year":"2018","unstructured":"Akoglu H (2018) User\u2019s guide to correlation coefficients. Turk J Emerg Med 18(3):91\u201393","journal-title":"Turk J Emerg Med"},{"issue":"111","key":"10631_CR5","first-page":"1","volume":"21","author":"E Alcoba\u00e7a","year":"2020","unstructured":"Alcoba\u00e7a E, Siqueira F, Rivolli A, Garcia LPF, Oliva JT, De Carvalho ACPLF (2020) Mfe: towards reproducible meta-feature extraction. J Mach Learn Res 21(111):1\u20135","journal-title":"J Mach Learn Res"},{"key":"10631_CR6","doi-asserted-by":"crossref","unstructured":"Ali S, Arcaini P, Pradhan D, Safdar SA, Yue T (2020) Quality indicators in search-based software engineering: an empirical evaluation. ACM Trans Softw Eng Methodol (TOSEM)29(2):1\u201329","DOI":"10.1145\/3375636"},{"key":"10631_CR7","doi-asserted-by":"crossref","unstructured":"Bender EM, Gebru T, McMillan-Major A, Shmitchell S (2021) On the dangers of stochastic parrots: can language models be too big? In Proceedings of the 2021 ACM conference on fairness, accountability, and transparency, pp 610\u2013623","DOI":"10.1145\/3442188.3445922"},{"key":"10631_CR8","doi-asserted-by":"crossref","unstructured":"Bhat A, Coursey A, Hu G, Li S, Nahar N, Zhou S, K\u00e4stner C, Guo JLC (2023) Aspirations and practice of ml model documentation: moving the needle with nudging and traceability. In Proceedings of the 2023 CHI conference on human factors in computing systems, pp 1\u201317","DOI":"10.1145\/3544548.3581518"},{"issue":"6","key":"10631_CR9","doi-asserted-by":"publisher","first-page":"1834","DOI":"10.1109\/TSE.2020.3038881","volume":"48","author":"T Bi","year":"2020","unstructured":"Bi T, Xia X, Lo D, Grundy J, Zimmermann T (2020) An empirical study of release note production and usage in practice. IEEE Tran Softw Eng 48(6):1834\u20131852","journal-title":"IEEE Tran Softw Eng"},{"key":"10631_CR10","unstructured":"Bobrovskis S, Jurenoks A (2018) A survey of continuous integration, continuous delivery and continuos deployment. In BIR workshops, pp 314\u2013322"},{"key":"10631_CR11","unstructured":"Boslaugh S (2012) Statistics in a nutshell: A desktop quick reference. \u201cO\u2019Reilly Media, Inc.\u201d"},{"issue":"3","key":"10631_CR12","doi-asserted-by":"publisher","first-page":"294","DOI":"10.1177\/0049124113500475","volume":"42","author":"JL Campbell","year":"2013","unstructured":"Campbell JL, Quincy C, Osserman J, Pedersen OK (2013) Coding in-depth semistructured interviews: problems of unitization and intercoder reliability and agreement. Sociol Methods Res 42(3):294\u2013320","journal-title":"Sociol Methods Res"},{"key":"10631_CR13","doi-asserted-by":"crossref","unstructured":"Carvalho L, Seco JC (2021) Deep semantic versioning for evolution and variability. In Proceedings of the 23rd international symposium on principles and practice of declarative programming, pp 1\u201313","DOI":"10.1145\/3479394.3479416"},{"key":"10631_CR14","doi-asserted-by":"crossref","unstructured":"Casta\u00f1o J, Mart\u00ednez-Fern\u00e1ndez S, Franch X, Bogner J (2023) Exploring the carbon footprint of hugging face\u2019s ml models: a repository mining study. In 2023 ACM\/IEEE international symposium on empirical software engineering and measurement (ESEM), IEEE, pp 1\u201312","DOI":"10.1109\/ESEM56168.2023.10304801"},{"key":"10631_CR15","doi-asserted-by":"crossref","unstructured":"Casta\u00f1o J, Mart\u00ednez-Fern\u00e1ndez S, Franch X, Bogner J (2024) Analyzing the evolution and maintenance of ml models on hugging face. In 2024 IEEE\/ACM 21st international conference on mining software repositories (MSR), IEEE, pp 607\u2013618","DOI":"10.1145\/3643991.3644898"},{"issue":"2","key":"10631_CR16","doi-asserted-by":"publisher","first-page":"197","DOI":"10.1016\/j.jclinepi.2012.09.002","volume":"66","author":"K Cocks","year":"2013","unstructured":"Cocks K, Torgerson DJ (2013) Sample size calculations for pilot randomized trials: a confidence interval approach. J Clin Epidemiol 66(2):197\u2013201","journal-title":"J Clin Epidemiol"},{"key":"10631_CR17","doi-asserted-by":"crossref","unstructured":"Conneau A, Khandelwal K, Goyal N, Chaudhary V, Wenzek G, Guzm\u00e1n F, Grave E, Ott M, Zettlemoyer L, Stoyanov V (2019) Unsupervised cross-lingual representation learning at scale. arXiv preprint arXiv:1911.02116","DOI":"10.18653\/v1\/2020.acl-main.747"},{"key":"10631_CR18","doi-asserted-by":"crossref","unstructured":"Crisan A, Drouhard M, Vig J, Rajani N (2022) Interactive model cards: a human-centered approach to model documentation. In Proceedings of the 2022 ACM conference on fairness, accountability, and transparency, pp 427\u2013439","DOI":"10.1145\/3531146.3533108"},{"issue":"6","key":"10631_CR19","doi-asserted-by":"publisher","first-page":"1226","DOI":"10.1109\/TSE.2019.2918315","volume":"47","author":"A Decan","year":"2019","unstructured":"Decan A, Mens T (2019) What do package dependencies tell us about semantic versioning? IEEE Tran Softw Eng 47(6):1226\u20131240","journal-title":"IEEE Tran Softw Eng"},{"key":"10631_CR20","doi-asserted-by":"crossref","unstructured":"Decan A, Mens T, Claes M, Grosjean P (2016) When github meets cran: an analysis of inter-repository package dependency problems. In 2016 IEEE 23rd international conference on software analysis, evolution, and reengineering (SANER), vol 1. IEEE, pp 493\u2013504","DOI":"10.1109\/SANER.2016.12"},{"key":"10631_CR21","unstructured":"Dettmers T, Pagnoni A, Holtzman A, Zettlemoyer L (2024) Qlora: efficient finetuning of quantized llms. Adv Neural Inf Process Syst 36"},{"key":"10631_CR22","unstructured":"Devlin J, Chang MW, Lee K, Toutanova K (2018) Bert:Pre-training of deep bidirectional transformers for language understanding. arXiv preprint arXiv:1810.04805"},{"issue":"3","key":"10631_CR23","doi-asserted-by":"publisher","first-page":"220","DOI":"10.1038\/s42256-023-00626-4","volume":"5","author":"N Ding","year":"2023","unstructured":"Ding N, Qin Y, Yang G, Wei F, Yang Z, Su Y, Hu S, Chen Y, Chan CM, Chen W et al (2023) (2023) Parameter-efficient fine-tuning of large-scale pre-trained language models. Nat Mach Intell 5(3):220\u2013235","journal-title":"Nat Mach Intell"},{"key":"10631_CR24","doi-asserted-by":"crossref","unstructured":"Dom\u00ednguez-\u00c1lvarez D, Gorla A (2019) Release practices for ios and Android apps. In Proceedings of the 3rd ACM SIGSOFT international workshop on app market analytics, pp 15\u201318","DOI":"10.1145\/3340496.3342762"},{"key":"10631_CR25","unstructured":"Eldan R, Li Y (2023) Tinystories:How small can language models be and still speak coherent english? arXiv preprint arXiv:2305.07759"},{"key":"10631_CR26","doi-asserted-by":"crossref","unstructured":"Gong Y, Liu G, Xue Y, Li R, Meng L (2023) A survey on dataset quality in machine learning. Inf Softw Technol, pp 107268","DOI":"10.1016\/j.infsof.2023.107268"},{"key":"10631_CR27","doi-asserted-by":"crossref","unstructured":"Gresta R, Durelli V, Cirilo E (2021) Naming practices in java projects: an empirical study. In Proceedings of the XX Brazilian symposium on software quality, pp 1\u201310","DOI":"10.1145\/3493244.3493258"},{"key":"10631_CR28","first-page":"2790","volume-title":"Parameter-efficient transfer learning for nlp","author":"N Houlsby","year":"2019","unstructured":"Houlsby N, Giurgiu A, Jastrzebski S, Morrone B, De Laroussilhe Q, Gesmundo A, Attariyan M, Gelly S (2019) Parameter-efficient transfer learning for nlp. In International conference on machine learning, PMLR, pp 2790\u20132799"},{"key":"10631_CR29","doi-asserted-by":"crossref","unstructured":"Howard J, Ruder S (2018) Universal language model fine-tuning for text classification. arXiv preprint arXiv:1801.06146 2018","DOI":"10.18653\/v1\/P18-1031"},{"key":"10631_CR30","doi-asserted-by":"crossref","unstructured":"Jacob B, Kligys S, Chen B, Zhu M, Tang M, Howard A, Adam H, Kalenichenko D (2018) Quantization and training of neural networks for efficient integer-arithmetic-only inference. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp 2704\u20132713","DOI":"10.1109\/CVPR.2018.00286"},{"key":"10631_CR31","unstructured":"Jiang AQ, Sablayrolles A, Mensch A, Bamford C, Chaplot DS, de\u00a0las Casas D, Bressand F, Lengyel G, Lample G, Saulnier L et\u00a0al (2023a) Mistral 7b. arXiv preprint arXiv:2310.06825"},{"key":"10631_CR32","unstructured":"Jiang W, Cheung C, Kim M, Kim H, Thiruvathukal GK, Davis JC (2024a) Naming practices of pre-trained models in hugging face"},{"key":"10631_CR33","unstructured":"Jiang W, Cheung C, Thiruvathukal GK, Davis JC (2023b) Exploring naming conventions (and defects) of pre-trained deep learning models in hugging face and other model hubs. arXiv preprint arXiv:2310.01642"},{"key":"10631_CR34","doi-asserted-by":"crossref","unstructured":"Jiang W, Synovic N, Hyatt M, Schorlemmer TR, Sethi R, Lu YH, Thiruvathukal GK, Davis JC (2023c) An empirical study of pre-trained model reuse in the hugging face deep learning model registry. arXiv preprint arXiv:2303.02552","DOI":"10.1109\/ICSE48619.2023.00206"},{"key":"10631_CR35","doi-asserted-by":"crossref","unstructured":"Jiang W, Synovic N, Sethi R, Indarapu A, Hyatt M, Schorlemmer TR, Thiruvathukal GK, Davis JC (2022) An empirical study of artifacts and security risks in the pre-trained model supply chain. In Proceedings of the 2022 ACM workshop on software supply chain offensive research and ecosystem defenses, pp 105\u2013114","DOI":"10.1145\/3560835.3564547"},{"key":"10631_CR36","doi-asserted-by":"crossref","unstructured":"Jiang W, Yasmin J, Jones J, Synovic N, Kuo J, Bielanski N, Tian Y, Thiruvathukal GK, Davis JC (2024b) Peatmoss:A dataset and initial analysis of pre-trained models in open-source software. arXiv preprint arXiv:2402.00699","DOI":"10.1145\/3643991.3644907"},{"key":"10631_CR37","doi-asserted-by":"crossref","unstructured":"Jones J, Jiang W, Synovic N, Thiruvathukal G, Davis J (2024) What do we know about hugging face? a systematic literature review and quantitative validation of qualitative claims. In Proceedings of the 18th ACM\/IEEE international symposium on empirical software engineering and measurement, pp 13\u201324","DOI":"10.1145\/3674805.3686665"},{"key":"10631_CR38","first-page":"10697","volume-title":"Deduplicating training data mitigates privacy risks in language models","author":"N Kandpal","year":"2022","unstructured":"Kandpal N, Wallace E, Raffel C (2022) Deduplicating training data mitigates privacy risks in language models. In international conference on machine learning, PMLR, pp 10697\u201310707"},{"key":"#cr-split#-10631_CR39.1","unstructured":"Kathikar A, Nair A, Lazarine B, Sachdeva A, Samtani S (2023) Assessing the vulnerabilities of the open-source artificial intelligence"},{"key":"#cr-split#-10631_CR39.2","unstructured":"(ai) landscape: a large-scale analysis of the hugging face platform. In 2023 IEEE international conference on intelligence and security informatics (ISI), IEEE, pp 1-6"},{"key":"10631_CR40","doi-asserted-by":"crossref","unstructured":"Kerzazi N, Adams B (2016) Who needs release and devops engineers, and why? In Proceedings of the international workshop on continuous software evolution and delivery, pp 77\u201383","DOI":"10.1145\/2896941.2896957"},{"key":"10631_CR41","doi-asserted-by":"crossref","unstructured":"Khomh F, Dhaliwal T, Zou Y, Adams B (2012) Do faster releases improve software quality? an empirical case study of mozilla Firefox. In 2012 9th IEEE working conference on mining software repositories (MSR), IEEE, pp 179\u2013188","DOI":"10.1109\/MSR.2012.6224279"},{"key":"10631_CR42","doi-asserted-by":"crossref","unstructured":"Kinahan S, Saidi P, Daliri A, Liss J, Berisha V (2024) Achieving reproducibility in eeg-based machine learning. In The 2024 ACM conference on fairness, accountability, and transparency, pp 1464\u20131474","DOI":"10.1145\/3630106.3658983"},{"key":"10631_CR43","first-page":"2611","volume":"34","author":"HR Kirk","year":"2021","unstructured":"Kirk HR, Jun Y, Volpin F, Iqbal H, Benussi E, Dreyer F, Shtedritski A, Asano Y (2021) Bias out-of-the-box: An empirical analysis of intersectional occupational biases in popular generative language models. Adv Neural Inf Process Syst 34:2611\u20132624","journal-title":"Adv Neural Inf Process Syst"},{"key":"10631_CR44","doi-asserted-by":"crossref","unstructured":"Lam P, Dietrich J, Pearce DJ (2020) Putting the semantics into semantic versioning. In Proceedings of the 2020 ACM SIGPLAN international symposium on new ideas, new paradigms, and reflections on programming and software, pp 157\u2013179","DOI":"10.1145\/3426428.3426922"},{"key":"10631_CR45","doi-asserted-by":"publisher","first-page":"55","DOI":"10.1016\/j.infsof.2016.10.001","volume":"82","author":"E Laukkanen","year":"2017","unstructured":"Laukkanen E, Itkonen J, Lassenius C (2017) Problems, causes and solutions when adopting continuous delivery\u2014a systematic literature review. Inf Softw Technol 82:55\u201379","journal-title":"Inf Softw Technol"},{"key":"10631_CR46","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1007\/s11334-007-0031-2","volume":"3","author":"D Lawrie","year":"2007","unstructured":"Lawrie D, Morrell C, Feild H, Binkley D (2007) Effective identifier names for comprehension and memory. Innov Syst Softw Eng 3:303\u2013318","journal-title":"Innov Syst Softw Eng"},{"key":"10631_CR47","first-page":"1950","volume":"35","author":"H Liu","year":"2022","unstructured":"Liu H, Tam D, Muqeeth M, Mohta J, Huang T, Bansal M, Raffel CA (2022) Few-shot parameter-efficient fine-tuning is better and cheaper than in-context learning. Adv Neural Inf Process Syst 35:1950\u20131965","journal-title":"Adv Neural Inf Process Syst"},{"key":"10631_CR48","doi-asserted-by":"crossref","unstructured":"Liu Y, Chen C, Zhang R, Qin T, Ji X, Lin H, Yang M (2020) Enhancing the interoperability between deep learning frameworks by model conversion. In Proceedings of the 28th ACM joint meeting on European software engineering conference and symposium on the foundations of software engineering, pp 1320\u20131330","DOI":"10.1145\/3368089.3417051"},{"key":"10631_CR49","unstructured":"Liu Y, Ott M, Goyal N, Du J, Joshi M, Chen D, Levy O, Lewis M, Zettlemoyer L, Stoyanov V (2019) Roberta: a robustly optimized bert pretraining approach. arXiv preprint arXiv:1907.11692"},{"key":"10631_CR50","doi-asserted-by":"crossref","unstructured":"Loomes MJ, Nehaniv CL, Wernick P (2005) The naming of systems and software evolvability. In IEEE international workshop on software evolvability (Software-Evolvability\u201905), IEEE, pp 23\u201328","DOI":"10.1109\/IWSE.2005.13"},{"key":"10631_CR51","unstructured":"Mao HH (2020) A survey on self-supervised pre-training for sequential transfer learning in neural networks. arXiv preprint arXiv:2007.00800"},{"key":"10631_CR52","unstructured":"Martin J. Fine-tuning and deployment. LinkedIn,. https:\/\/www.linkedin.com\/pulse\/fine-tuning-deployment-dr-john-martin-yvqyf"},{"key":"10631_CR53","doi-asserted-by":"crossref","unstructured":"Michlmayr M, Hunt F, Probert D (2007) Release management in free software projects: practices and problems. In open source development, adoption and innovation: IFIP working group 2.13 on open source software, June 11\u201314, 2007, Limerick, Ireland 3, Springer, pp 295\u2013300","DOI":"10.1007\/978-0-387-72486-7_31"},{"key":"10631_CR54","doi-asserted-by":"crossref","unstructured":"Min S, Seo M, Hajishirzi H (2017) Question answering through transfer learning from large fine-grained supervision data. arXiv preprint arXiv:1702.02171","DOI":"10.18653\/v1\/P17-2081"},{"key":"10631_CR55","doi-asserted-by":"crossref","unstructured":"Mitchell M, Wu S, Zaldivar A, Barnes P, Vasserman L, Hutchinson B, Spitzer E, Raji ID, Gebru T (2019) Model cards for model reporting. In Proceedings of the conference on fairness, accountability, and transparency, pp 220\u2013229","DOI":"10.1145\/3287560.3287596"},{"key":"10631_CR56","doi-asserted-by":"crossref","unstructured":"Nayebi M, Adams B, Ruhe G (2016) Release practices for mobile apps\u2013what do users and developers think? In 2016 ieee 23rd international conference on software analysis, evolution, and reengineering (saner), vol 1. IEEE, pp 552\u2013562","DOI":"10.1109\/SANER.2016.116"},{"key":"10631_CR57","doi-asserted-by":"crossref","unstructured":"Novakouski M, Lewis G, Anderson W, Davenport J (2012) Best practices for artifact versioning in service-oriented systems. Software Engineering Institute, Carnegie Mellon University, Pittsburgh, Pennsylvania, Technical Note CMU\/SEI-2011-TN-009","DOI":"10.21236\/ADA585496"},{"issue":"2","key":"10631_CR58","doi-asserted-by":"publisher","first-page":"2067","DOI":"10.1007\/s42001-024-00300-8","volume":"7","author":"C Osborne","year":"2024","unstructured":"Osborne C, Ding J, Kirk HR (2024) The ai community building the future? a quantitative analysis of development activity on hugging face hub. J Comput Soc Sci 7(2):2067\u20132105","journal-title":"J Comput Soc Sci"},{"key":"10631_CR59","doi-asserted-by":"crossref","unstructured":"Osborne C, Ding J, Kirk HR (2024) The ai community building the future? a quantitative analysis of development activity on hugging face hub. J Comput Soc Sci 7(2):2067\u20132105","DOI":"10.1007\/s42001-024-00300-8"},{"key":"10631_CR60","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa F, Varoquaux G, Gramfort A, Michel V, Thirion B, Grisel O, Blondel M, Prettenhofer P, Weiss R, Dubourg V et al (2011) Scikit-learn: Machine learning in python. J Mach Learn Res 12:2825\u20132830","journal-title":"J Mach Learn Res"},{"key":"10631_CR61","unstructured":"Pedregosa F, Varoquaux G, Gramfort A, Michel V, Thirion B, Grisel O, Blondel M, Prettenhofer P, Weiss R, Dubourg V et\u00a0al (2011) Scikit-learn:Machine learning in python. J Mach Learn Res 12:2825\u20132830"},{"key":"10631_CR62","doi-asserted-by":"publisher","DOI":"10.1016\/j.jss.2020.110657","volume":"168","author":"J P\u00e9rez","year":"2020","unstructured":"P\u00e9rez J, D\u00edaz J, Garcia-Martin J, Tabuenca B (2020) Systematic literature reviews in software engineering\u2014enhancement of the study selection process using cohen\u2019s kappa statistic. J Syst Softw 168:110657","journal-title":"J Syst Softw"},{"key":"10631_CR63","doi-asserted-by":"crossref","unstructured":"P\u00e9rez J, D\u00edaz J, Garcia-Martin J, Tabuenca B (2020) Systematic literature reviews in software engineering\u2014enhancement of the study selection process using cohen\u2019s kappa statistic. J Syst Softw 168:110657","DOI":"10.1016\/j.jss.2020.110657"},{"key":"10631_CR64","unstructured":"R\u00a0OpenAI. Gpt-4 technical report. View in Article 2:13. arxiv arXiv:2303.08774"},{"key":"10631_CR65","doi-asserted-by":"publisher","first-page":"140","DOI":"10.1016\/j.jss.2016.04.008","volume":"129","author":"S Raemaekers","year":"2017","unstructured":"Raemaekers S, van Deursen A, Visser J (2017) Semantic versioning and impact of breaking changes in the maven repository. J Syst Softw 129:140\u2013158","journal-title":"J Syst Softw"},{"key":"10631_CR66","doi-asserted-by":"crossref","unstructured":"Raemaekers S, van Deursen A, Visser J (2017) Semantic versioning and impact of breaking changes in the maven repository. J Syst Softw 129:140\u2013158","DOI":"10.1016\/j.jss.2016.04.008"},{"key":"10631_CR67","unstructured":"Saldana J (2015) The Coding Manual for Qualitative Researchers. Sage Publications"},{"key":"10631_CR68","volume-title":"The Coding Manual for Qualitative Researchers","author":"J Saldana","year":"2015","unstructured":"Saldana J (2015) The Coding Manual for Qualitative Researchers. Sage Publications"},{"key":"10631_CR69","doi-asserted-by":"publisher","DOI":"10.1016\/j.psychres.2021.114135","volume":"304","author":"J Sarzynska-Wawer","year":"2021","unstructured":"Sarzynska-Wawer J, Wawer A, Pawlak A, Szymanowska J, Stefaniak I, Jarkiewicz M, Okruszek L (2021) Detecting formal thought disorder by deep contextualized word representations. Psychiatry Res 304:114135","journal-title":"Psychiatry Res"},{"key":"10631_CR70","doi-asserted-by":"crossref","unstructured":"Seacord RC, Hissam SA, Wallnau KC (1998) Agora: a search engine for software components. IEEE Internet Comput 2 (6):62","DOI":"10.1109\/4236.735988"},{"issue":"6","key":"10631_CR71","doi-asserted-by":"publisher","first-page":"62","DOI":"10.1109\/4236.735988","volume":"2","author":"RC Seacord","year":"1998","unstructured":"Seacord RC, Hissam SA, Wallnau KC (1998) Agora: a search engine for software components. IEEE Internet Comput 2(6):62","journal-title":"IEEE Internet Comput"},{"key":"10631_CR72","doi-asserted-by":"publisher","first-page":"3909","DOI":"10.1109\/ACCESS.2017.2685629","volume":"5","author":"M Shahin","year":"2017","unstructured":"Shahin M, Babar MA, Zhu L (2017) Continuous integration, delivery and deployment:a systematic review on approaches, tools, challenges and practices. IEEE access 5:3909\u20133943","journal-title":"IEEE access"},{"key":"10631_CR73","doi-asserted-by":"crossref","unstructured":"Shahin M, Babar MA, Zhu L (2017) Continuous integration, delivery and deployment:a systematic review on approaches, tools, challenges and practices. IEEE access 5:3909\u20133943","DOI":"10.1109\/ACCESS.2017.2685629"},{"key":"10631_CR74","unstructured":"Singh AS, Masuku MB (2014) Sampling techniques & determination of sample size in applied statistics research:An overview. Int J Econ Commer Manag 2(11):1\u201322"},{"issue":"11","key":"10631_CR75","first-page":"1","volume":"2","author":"AS Singh","year":"2014","unstructured":"Singh AS, Masuku MB (2014) Sampling techniques & determination of sample size in applied statistics research: An overview. Int J Econ Commer Manag 2(11):1\u201322","journal-title":"Int J Econ Commer Manag"},{"key":"10631_CR76","doi-asserted-by":"crossref","unstructured":"Stuckenholz A (2005) Component evolution and versioning state of the art. ACM SIGSOFT Softw Eng Notes 30(1):7","DOI":"10.1145\/1039174.1039197"},{"issue":"1","key":"10631_CR77","doi-asserted-by":"publisher","first-page":"7","DOI":"10.1145\/1039174.1039197","volume":"30","author":"A Stuckenholz","year":"2005","unstructured":"Stuckenholz A (2005) Component evolution and versioning state of the art. ACM SIGSOFT Softw Eng Notes 30(1):7","journal-title":"ACM SIGSOFT Softw Eng Notes"},{"key":"10631_CR78","doi-asserted-by":"crossref","unstructured":"Sun S, Cheng Y, Gan Z, Liu J (2019) Patient knowledge distillation for bert model compression. arXiv preprint arXiv:1908.09355","DOI":"10.18653\/v1\/D19-1441"},{"key":"10631_CR79","doi-asserted-by":"crossref","unstructured":"Taraghi M, Dorcelus G, Foundjem A, Tambon F, Khomh F (2024) Deep learning model reuse in the huggingface community: challenges, benefit and trends. arXiv preprint arXiv:2401.13177","DOI":"10.1109\/SANER60148.2024.00059"},{"key":"10631_CR80","unstructured":"Team G, Mesnard T, Hardin C, Dadashi R, Bhupatiraju S, Pathak S, Sifre L, Rivi\u00e8re M, Kale MS, Love J et\u00a0al (2024) Gemma: open models based on gemini research and technology. arXiv preprint arXiv:2403.08295"},{"key":"10631_CR81","doi-asserted-by":"crossref","unstructured":"Toma TR, Bezemer CP (2024) An exploratory study of dataset and model management in open source machine learning applications","DOI":"10.1145\/3644815.3644963"},{"key":"10631_CR82","unstructured":"Touvron H, Lavril T, Izacard G, Martinet X, Lachaux MA, Lacroix T, Rozi\u00e8re B, Goyal N, Hambro E, Azhar F et\u00a0al (2023) Llama:Open and efficient foundation language models. arXiv preprint arXiv:2302.13971"},{"key":"10631_CR83","doi-asserted-by":"crossref","unstructured":"Turri V, Morrison K, Robinson KM, Abidi C, Perer A, Forlizzi J, Dzombak R (2024) Transparency in the wild:Navigating transparency in a deployed ai system to broaden need-finding approaches. In The 2024 ACM conference on fairness, accountability, and transparency, pp 1494\u20131514","DOI":"10.1145\/3630106.3658985"},{"key":"10631_CR84","first-page":"1","volume-title":"Cohen\u2019s kappa coefficient as a performance measure for feature selection","author":"SM Vieira","year":"2010","unstructured":"Vieira SM, Kaymak U, Sousa JMC (2010) Cohen\u2019s kappa coefficient as a performance measure for feature selection. In International conference on fuzzy systems, IEEE, pp 1\u20138"},{"key":"10631_CR85","doi-asserted-by":"crossref","unstructured":"Wadhwani A, Jain P (2020) Machine learning model cards transparency review: using model card toolkit. In 2020 IEEE pune section international conference (PuneCon), IEEE, pp 133\u2013137","DOI":"10.1109\/PuneCon50868.2020.9362382"},{"key":"10631_CR86","doi-asserted-by":"crossref","unstructured":"Wang H, Li J, Wu H, Hovy E, Sun Y (2022) Pre-trained language models and their applications. Eng","DOI":"10.1016\/j.eng.2022.04.024"},{"key":"10631_CR87","doi-asserted-by":"crossref","unstructured":"Williams LL, Quave K (2019) Chapter 10\u2013tests of proportions:chi-square, likelihood ratio, fisher\u2019s exact test. Quantitative anthropology, pp 123\u201341","DOI":"10.1016\/B978-0-12-812775-9.00010-4"},{"issue":"1","key":"10631_CR88","first-page":"1","volume":"4","author":"JR Wood","year":"2008","unstructured":"Wood JR, Wood LE (2008) Card sorting:current practices and beyond. J Usability Stud 4(1):1\u20136","journal-title":"J Usability Stud"},{"key":"10631_CR89","doi-asserted-by":"crossref","unstructured":"Wortsman M, Ilharco G, Kim JW, Li M, Kornblith S, Roelofs R, Lopes RG, Hajishirzi H, Farhadi A, Namkoong H et\u00a0al (2022) Robust fine-tuning of zero-shot models. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 7959\u20137971","DOI":"10.1109\/CVPR52688.2022.00780"},{"key":"10631_CR90","doi-asserted-by":"crossref","unstructured":"Xia B, Bi T, Xing Z, Lu Q, Zhu L (2023) An empirical study on software bill of materials:Where we stand and the road ahead. In 2023 IEEE\/ACM 45th international conference on software engineering (ICSE), IEEE, pp 2630\u20132642","DOI":"10.1109\/ICSE48619.2023.00219"},{"issue":"1","key":"10631_CR91","doi-asserted-by":"publisher","first-page":"114","DOI":"10.1109\/MS.2020.2975159","volume":"38","author":"M Xiu","year":"2023","unstructured":"Xiu M, Jiang ZMJ, Adams B (2023) An exploratory study of machine learning model stores. IEEE Softw 38(1):114\u2013122","journal-title":"IEEE Softw"},{"issue":"4","key":"10631_CR92","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/2791577","volume":"47","author":"T Xu","year":"2015","unstructured":"Xu T, Zhou Y (2015) Systems approaches to tackling configuration errors: a survey. ACM Comput Surv (CSUR) 47(4):1\u201341","journal-title":"ACM Comput Surv (CSUR)"},{"key":"10631_CR93","doi-asserted-by":"publisher","first-page":"106397","DOI":"10.1016\/j.infsof.2020.106397","volume":"130","author":"L Yang","year":"2021","unstructured":"Yang L, Zhang H, Shen H, Huang X, Zhou X, Rong G, Shao D (2021) Quality assessment in systematic literature reviews: a software engineering perspective. Inf Softw Technol 130:106397","journal-title":"Inf Softw Technol"},{"key":"10631_CR94","doi-asserted-by":"crossref","unstructured":"Yang Z, Shi J, Lo D (2024) Ecosystem of large language models for code. arXiv preprint arXiv:2405.16746","DOI":"10.1145\/3731753"},{"key":"10631_CR95","doi-asserted-by":"crossref","unstructured":"Yin Z, Ma X, Zheng J, Zhou Y, Bairavasundaram LN, Pasupathy S (2011) An empirical study on configuration errors in commercial and open source systems. In Proceedings of the 23rd ACM symposium on operating systems principles, pp 159\u2013172","DOI":"10.1145\/2043556.2043572"},{"key":"10631_CR96","unstructured":"Zhao WX, Zhou K, Li J, Tang T, Wang X, Hou Y, Min Y, Zhang B, Zhang J, Dong Z et\u00a0al (2023) A survey of large language models. arXiv preprint arXiv:2303.18223"},{"key":"10631_CR97","unstructured":"Zhu M, Gupta S (2017) To prune, or not to prune:exploring the efficacy of pruning for model compression. arXiv preprint arXiv:1710.01878"}],"container-title":["Empirical Software Engineering"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10664-025-10631-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10664-025-10631-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10664-025-10631-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,20]],"date-time":"2025-11-20T13:28:06Z","timestamp":1763645286000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10664-025-10631-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,3,6]]},"references-count":98,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2025,5]]}},"alternative-id":["10631"],"URL":"https:\/\/doi.org\/10.1007\/s10664-025-10631-3","relation":{},"ISSN":["1382-3256","1573-7616"],"issn-type":[{"value":"1382-3256","type":"print"},{"value":"1573-7616","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,3,6]]},"assertion":[{"value":"17 February 2025","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 March 2025","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing interests or personal relationships that could have (appeared to) influenced the work reported in this article.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflicts of Interests\/Competing Interests"}},{"value":"This study does not involve human participants or animals.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical Approval"}},{"value":"No human subjects were involved in this study.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Informed Consent"}}],"article-number":"78"}}