{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,16]],"date-time":"2025-09-16T18:45:20Z","timestamp":1758048320820,"version":"3.44.0"},"reference-count":29,"publisher":"Springer Science and Business Media LLC","issue":"5","license":[{"start":{"date-parts":[[2025,8,1]],"date-time":"2025-08-01T00:00:00Z","timestamp":1754006400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,8,1]],"date-time":"2025-08-01T00:00:00Z","timestamp":1754006400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100021856","name":"Ministero dell\u2019Universit\u00e0 e della Ricerca","doi-asserted-by":"publisher","award":["P2022SELA7"],"award-info":[{"award-number":["P2022SELA7"]}],"id":[{"id":"10.13039\/501100021856","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Empir Software Eng"],"published-print":{"date-parts":[[2025,9]]},"DOI":"10.1007\/s10664-025-10680-8","type":"journal-article","created":{"date-parts":[[2025,8,1]],"date-time":"2025-08-01T12:13:20Z","timestamp":1754050400000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Mining and measuring the impact of change patterns for improving the size and build time of docker images"],"prefix":"10.1007","volume":"30","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-5241-1608","authenticated-orcid":false,"given":"Giovanni","family":"Rosa","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5443-1303","authenticated-orcid":false,"given":"Emanuela","family":"Guglielmi","sequence":"additional","affiliation":[]},{"given":"Mattia","family":"Iannone","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1764-9685","authenticated-orcid":false,"given":"Simone","family":"Scalabrino","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7995-8582","authenticated-orcid":false,"given":"Rocco","family":"Oliveto","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,8,1]]},"reference":[{"issue":"2","key":"10680_CR1","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s10664-021-10081-7","volume":"27","author":"H Azuma","year":"2022","unstructured":"Azuma H, Matsumoto S, Kamei Y, Kusumoto S (2022) An empirical study on self-admitted technical debt in dockerfiles. Empir Softw Eng 27(2):1\u201326","journal-title":"Empir Softw Eng"},{"issue":"3","key":"10680_CR2","doi-asserted-by":"publisher","first-page":"81","DOI":"10.1109\/MCC.2014.51","volume":"1","author":"D Bernstein","year":"2014","unstructured":"Bernstein D (2014) Containers and cloud: from lxc to docker to kubernetes. IEEE Cloud Comput 1(3):81\u201384","journal-title":"IEEE Cloud Comput"},{"key":"10680_CR3","doi-asserted-by":"crossref","unstructured":"Bui QC, Lauk\u00f6tter M, Scandariato R (2023) Dockercleaner: Automatic repair of security smells in dockerfiles. In: 2023 IEEE International Conference on Software Maintenance and Evolution (ICSME), p To Appear. IEEE","DOI":"10.1109\/ICSME58846.2023.00026"},{"key":"10680_CR4","doi-asserted-by":"crossref","unstructured":"Cito J, Schermann G, Wittern JE, Leitner P, Zumberi S, Gall HC (2017) An empirical analysis of the docker container ecosystem on github. In: 2017 IEEE\/ACM 14th International Conference on Mining Software Repositories (MSR), pp 323\u2013333. IEEE","DOI":"10.1109\/MSR.2017.67"},{"key":"10680_CR5","doi-asserted-by":"crossref","unstructured":"Durieux T (2024) Empirical study of the docker smells impact on the image size pp 1\u201312","DOI":"10.1145\/3597503.3639143"},{"key":"10680_CR6","doi-asserted-by":"crossref","unstructured":"Eng K, Hindle A (2021) Revisiting dockerfiles in open source software over time. In: 2021 IEEE\/ACM 18th International Conference on Mining Software Repositories (MSR), pp 449\u2013459. IEEE","DOI":"10.1109\/MSR52588.2021.00057"},{"key":"10680_CR7","unstructured":"hadolint (2015) Dockerfile linter, validate inline bash, written in haskell. https:\/\/github.com\/hadolint\/hadolint. [Online; Accessed 2 Jun 2022]"},{"key":"10680_CR8","doi-asserted-by":"crossref","unstructured":"Henkel J, Bird C, Lahiri SK, Reps T (2020) A dataset of Dockerfiles. In: Proceedings of the 17th international conference on mining software repositories, pp 528\u2013532","DOI":"10.1145\/3379597.3387498"},{"key":"10680_CR9","doi-asserted-by":"crossref","unstructured":"Henkel J, Bird C, Lahiri SK, Reps T (2020) Learning from, understanding, and supporting devops artifacts for docker. In: 2020 IEEE\/ACM 42nd International Conference on Software Engineering (ICSE), pp 38\u201349. IEEE","DOI":"10.1145\/3377811.3380406"},{"key":"10680_CR10","doi-asserted-by":"crossref","unstructured":"Henkel J, Silva D, Teixeira L, d\u2019Amorim M, Reps T (2021) Shipwright: a human-in-the-loop system for dockerfile repair. In: 2021 IEEE\/ACM 43rd International Conference on Software Engineering (ICSE), pp 1148\u20131160. IEEE","DOI":"10.1109\/ICSE43902.2021.00106"},{"key":"10680_CR11","doi-asserted-by":"crossref","unstructured":"Jiang Q (2022) Improving performance of docker instance via image reconstruction. In: International conference on big data intelligence and computing, pp 511\u2013522. Springer","DOI":"10.1007\/978-981-99-2233-8_37"},{"key":"10680_CR12","doi-asserted-by":"crossref","unstructured":"Kitajima S, Sekiguchi A (2020) Latest image recommendation method for automatic base image update in dockerfile. In: International conference on service-oriented computing, pp 547\u2013562. Springer","DOI":"10.1007\/978-3-030-65310-1_40"},{"key":"10680_CR13","doi-asserted-by":"crossref","unstructured":"Ksontini E, Kessentini M, Ferreira TdN, Hassan F (2021) Refactorings and technical debt in docker projects: an empirical study. In: 2021 36th IEEE\/ACM International Conference on Automated Software Engineering (ASE), pp 781\u2013791. IEEE","DOI":"10.1109\/ASE51524.2021.9678585"},{"key":"10680_CR14","doi-asserted-by":"crossref","unstructured":"Landis JR, Koch GG (1977) An application of hierarchical kappa-type statistics in the assessment of majority agreement among multiple observers. Biometrics 363\u2013374","DOI":"10.2307\/2529786"},{"key":"10680_CR15","doi-asserted-by":"crossref","unstructured":"Lin C, Nadi S, Khazaei H (2020) A large-scale data set and an empirical study of docker images hosted on docker hub. In: 2020 IEEE International Conference on Software Maintenance and Evolution (ICSME), pp 371\u2013381. IEEE","DOI":"10.1109\/ICSME46990.2020.00043"},{"issue":"2","key":"10680_CR16","doi-asserted-by":"publisher","first-page":"545","DOI":"10.11144\/Javeriana.upsy10-2.cdcp","volume":"10","author":"G Macbeth","year":"2011","unstructured":"Macbeth G, Razumiejczyk E, Ledesma RD (2011) Cliff\u2019s delta calculator: a non-parametric effect size program for two groups of observations. Univ Psychol 10(2):545\u2013555","journal-title":"Univ Psychol"},{"key":"10680_CR17","doi-asserted-by":"crossref","unstructured":"Rastogi V, Davidson D, De\u00a0Carli L, Jha S, McDaniel P (2017a) Cimplifier: automatically debloating containers. In: Proceedings of the 2017 11th joint meeting on foundations of software engineering, pp 476\u2013486","DOI":"10.1145\/3106237.3106271"},{"key":"10680_CR18","doi-asserted-by":"crossref","unstructured":"Rastogi V, Niddodi C, Mohan S, Jha S (2017b) New directions for container debloating. In: Proceedings of the 2017 workshop on forming an ecosystem around software transformation, pp 51\u201356","DOI":"10.1145\/3141235.3141241"},{"key":"10680_CR19","doi-asserted-by":"publisher","unstructured":"Rosa G, Guglielmi E, Iannone M, Scalabrino S, Oliveto R (2024) Replication package for \u201cmining and measuring the impact of change patterns for improving the size and build time of docker images\u201d. https:\/\/doi.org\/10.6084\/m9.figshare.24579580","DOI":"10.6084\/m9.figshare.24579580"},{"key":"10680_CR20","doi-asserted-by":"crossref","unstructured":"Rosa G, Scalabrino S, Bavota G, Oliveto R (2023) What quality aspects influence the adoption of docker images? ACM Trans Softw Eng Methodol","DOI":"10.1145\/3603111"},{"issue":"5","key":"10680_CR21","doi-asserted-by":"publisher","first-page":"108","DOI":"10.1007\/s10664-024-10471-7","volume":"29","author":"G Rosa","year":"2024","unstructured":"Rosa G, Zappone F, Scalabrino S, Oliveto R (2024) Fixing dockerfile smells: an empirical study. Empir Softw Eng 29(5):108","journal-title":"Empir Softw Eng"},{"key":"10680_CR22","unstructured":"Skourtis D, Rupprecht L, Tarasov V, Megiddo N (2019) Carving perfect layers out of docker images. In: 11th USENIX Workshop on Hot Topics in Cloud Computing (HotCloud 19)"},{"key":"10680_CR23","unstructured":"Spencer D (2009) Card sorting: designing usable categories. Rosenfeld Media"},{"key":"10680_CR24","doi-asserted-by":"crossref","unstructured":"Woolson RF (2007) Wilcoxon signed-rank test. Wiley encyclopedia of clinical trials, pp 1\u20133","DOI":"10.1002\/9780471462422.eoct979"},{"key":"10680_CR25","doi-asserted-by":"publisher","first-page":"34127","DOI":"10.1109\/ACCESS.2020.2973750","volume":"8","author":"Y Wu","year":"2020","unstructured":"Wu Y, Zhang Y, Wang T, Wang H (2020) Characterizing the occurrence of dockerfile smells in open-source software: an empirical study. IEEE Access 8:34127\u201334139","journal-title":"IEEE Access"},{"issue":"2","key":"10680_CR26","doi-asserted-by":"publisher","first-page":"19","DOI":"10.1007\/s10664-020-09908-6","volume":"26","author":"A Zerouali","year":"2021","unstructured":"Zerouali A, Mens T, Decan A, Gonzalez-Barahona J, Robles G (2021) A multi-dimensional analysis of technical lag in Debian-based docker images. Empir Softw Eng 26(2):19","journal-title":"Empir Softw Eng"},{"key":"10680_CR27","doi-asserted-by":"crossref","unstructured":"Zhang Y, Vasilescu B, Wang H, Filkov V (2018) One size does not fit all: an empirical study of containerized continuous deployment workflows. In: Proceedings of the 2018 26th ACM joint meeting on European software engineering conference and symposium on the foundations of software engineering, pp 295\u2013306","DOI":"10.1145\/3236024.3236033"},{"key":"10680_CR28","doi-asserted-by":"crossref","unstructured":"Zhang Y, Zhang Y, Mao X, Wu Y, Lin B, Wang S (2022) Recommending base image for docker containers based on deep configuration comprehension. In: 2022 IEEE International Conference on Software Analysis, Evolution and Reengineering (SANER), pp 449\u2013453. IEEE","DOI":"10.1109\/SANER53432.2022.00060"},{"key":"10680_CR29","doi-asserted-by":"crossref","unstructured":"Zhou Y, Zhan W, Li Z, Han T, Chen T, Gall H (2022) Drive: Dockerfile rule mining and violation detection. arXiv:2212.05648","DOI":"10.1145\/3617173"}],"container-title":["Empirical Software Engineering"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10664-025-10680-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10664-025-10680-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10664-025-10680-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,13]],"date-time":"2025-09-13T08:55:26Z","timestamp":1757753726000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10664-025-10680-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,8,1]]},"references-count":29,"journal-issue":{"issue":"5","published-print":{"date-parts":[[2025,9]]}},"alternative-id":["10680"],"URL":"https:\/\/doi.org\/10.1007\/s10664-025-10680-8","relation":{},"ISSN":["1382-3256","1573-7616"],"issn-type":[{"type":"print","value":"1382-3256"},{"type":"electronic","value":"1573-7616"}],"subject":[],"published":{"date-parts":[[2025,8,1]]},"assertion":[{"value":"27 May 2025","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"1 August 2025","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of Interest"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical Approval"}},{"value":"Not applicable.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Informed Consent"}},{"value":"Not applicable.","order":5,"name":"Ethics","group":{"name":"EthicsHeading","label":"Clinical Trial Number"}}],"article-number":"150"}}