{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:12:57Z","timestamp":1750219977189,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":25,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,6,27]],"date-time":"2023-06-27T00:00:00Z","timestamp":1687824000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,6,27]]},"DOI":"10.1145\/3589806.3600043","type":"proceedings-article","created":{"date-parts":[[2023,6,28]],"date-time":"2023-06-28T20:09:22Z","timestamp":1687982962000},"page":"27-36","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":2,"title":["Fingerprinting and Building Large Reproducible Datasets"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0008-2019-1058","authenticated-orcid":false,"given":"Romain","family":"Lefeuvre","sequence":"first","affiliation":[{"name":"Inria, University of Rennes, France"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9868-1814","authenticated-orcid":false,"given":"Jessie","family":"Galasso","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Operations Research, DIRO, Universit\u00e9 de Montr\u00e9al, Canada"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7104-7848","authenticated-orcid":false,"given":"Benoit","family":"Combemale","sequence":"additional","affiliation":[{"name":"Computer Science Department, University of Rennes, IRISA &amp; Inria, France"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6304-9926","authenticated-orcid":false,"given":"Houari","family":"Sahraoui","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Operations Research, DIRO, Universit\u00e9 de Montr\u00e9al, Canada"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4576-136X","authenticated-orcid":false,"given":"Stefano","family":"Zacchiroli","sequence":"additional","affiliation":[{"name":"LTCI, T\u00e9l\u00e9com Paris, Institut Polytechnique de Paris, France"}]}],"member":"320","published-online":{"date-parts":[[2023,6,28]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/2901739.2903508"},{"key":"e_1_3_2_1_2_1","volume-title":"Terminologies for reproducible research. arXiv preprint arXiv:1802.03311","author":"Barba A","year":"2018","unstructured":"Lorena\u00a0A Barba. 2018. Terminologies for reproducible research. arXiv preprint arXiv:1802.03311 (2018)."},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/SANER48275.2020.9054827"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-30982-3_3"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/2901739.2901776"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/MCSE.2019.2963148"},{"key":"e_1_3_2_1_7_1","first-page":"501","article-title":"Replication of empirical studies in software engineering research: a systematic mapping study","volume":"19","author":"Da\u00a0Silva QB","year":"2014","unstructured":"Fabio\u00a0QB Da\u00a0Silva, Marcos Suassuna, A\u00a0C\u00e9sar\u00a0C Fran\u00e7a, Alicia\u00a0M Grubb, Tatiana\u00a0B Gouveia, Cleviton\u00a0VF Monteiro, and Igor\u00a0Ebrahim dos Santos. 2014. Replication of empirical studies in software engineering research: a systematic mapping study. Empirical Software Engineering 19, 3 (2014), 501\u2013557.","journal-title":"Empirical Software Engineering"},{"key":"e_1_3_2_1_8_1","volume-title":"Software heritage: Why and how to preserve software source code. In iPRES","author":"Di\u00a0Cosmo Roberto","year":"2017","unstructured":"Roberto Di\u00a0Cosmo and Stefano Zacchiroli. 2017. Software heritage: Why and how to preserve software source code. In iPRES 2017. 1\u201310."},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1145\/2803171"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/3183713.3190657"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1145\/3196398.3196460"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.5555\/2487085.2487132"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/3178876.3186014"},{"volume-title":"LASER Summer School","author":"Juristo Natalia","key":"e_1_3_2_1_14_1","unstructured":"Natalia Juristo and Omar\u00a0S G\u00f3mez. 2012. Replication of software engineering experiments. In LASER Summer School. Springer, 60\u201388."},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10664-015-9393-5"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/3379597.3387503"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.dss.2018.10.007"},{"key":"e_1_3_2_1_18_1","unstructured":"Antoine Pietri. 2021. Organizing the graph of public software development for large-scale mining. Theses. Universit\u00e9 Paris Cit\u00e9. https:\/\/hal.science\/tel-03515795"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1109\/MSR.2019.00030"},{"key":"e_1_3_2_1_20_1","volume-title":"The role of replications in empirical software engineering. Empirical software engineering 13, 2","author":"Shull J","year":"2008","unstructured":"Forrest\u00a0J Shull, Jeffrey\u00a0C Carver, Sira Vegas, and Natalia Juristo. 2008. The role of replications in empirical software engineering. Empirical software engineering 13, 2 (2008), 211\u2013218."},{"key":"e_1_3_2_1_21_1","volume-title":"Methodologies, Reproducibility, and Tools. arXiv preprint arXiv:2204.08108","author":"Tutko Adam","year":"2022","unstructured":"Adam Tutko, Austin\u00a0Z Henley, and Audris Mockus. 2022. How are Software Repositories Mined? A Systematic Literature Review of Workflows, Methodologies, Reproducibility, and Tools. arXiv preprint arXiv:2204.08108 (2022)."},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.dss.2019.113133"},{"key":"e_1_3_2_1_23_1","first-page":"106791","article-title":"A systematic process for Mining Software Repositories: Results from a systematic literature review","volume":"144","author":"Vidoni M","year":"2022","unstructured":"M Vidoni. 2022. A systematic process for Mining Software Repositories: Results from a systematic literature review. IST 144 (2022), 106791.","journal-title":"IST"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.jss.2021.111009"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11390-018-1864-x"}],"event":{"name":"ACM REP '23: 2023 ACM Conference on Reproducibility and Replicability","sponsor":["EIGREP Emerging Interest Group on Reproducibility and Replicability"],"location":"Santa Cruz CA USA","acronym":"ACM REP '23"},"container-title":["Proceedings of the 2023 ACM Conference on Reproducibility and Replicability"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3589806.3600043","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3589806.3600043","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T17:49:22Z","timestamp":1750182562000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3589806.3600043"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,6,27]]},"references-count":25,"alternative-id":["10.1145\/3589806.3600043","10.1145\/3589806"],"URL":"https:\/\/doi.org\/10.1145\/3589806.3600043","relation":{},"subject":[],"published":{"date-parts":[[2023,6,27]]},"assertion":[{"value":"2023-06-28","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}