{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:23:41Z","timestamp":1750220621153,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":19,"publisher":"ACM","license":[{"start":{"date-parts":[[2020,11,13]],"date-time":"2020-11-13T00:00:00Z","timestamp":1605225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2020,11,13]]},"DOI":"10.1145\/3416505.3423562","type":"proceedings-article","created":{"date-parts":[[2020,11,6]],"date-time":"2020-11-06T23:01:37Z","timestamp":1604703697000},"page":"13-18","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Speeding up the data extraction of machine learning approaches: a distributed framework"],"prefix":"10.1145","author":[{"given":"Martin","family":"Steinhauer","sequence":"first","affiliation":[{"name":"University of Salerno, Italy"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Fabio","family":"Palomba","sequence":"additional","affiliation":[{"name":"University of Salerno, Italy"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2020,11,13]]},"reference":[{"unstructured":"Apache Parquet.  Apache Parquet.","key":"e_1_3_2_1_1_1"},{"unstructured":"Getting connection refused \u00b7 Issue #171 \u00b7 src-d\/datasets. https:\/\/github.com\/srcd\/datasets\/issues\/171.  Getting connection refused \u00b7 Issue #171 \u00b7 src-d\/datasets. https:\/\/github.com\/srcd\/datasets\/issues\/171.","key":"e_1_3_2_1_2_1"},{"unstructured":"GraphX-Spark 2.4.6 Documentation. https:\/\/spark.apache.org\/docs\/latest\/graphxprogramming-guide.html.  GraphX-Spark 2.4.6 Documentation. https:\/\/spark.apache.org\/docs\/latest\/graphxprogramming-guide.html.","key":"e_1_3_2_1_3_1"},{"unstructured":"ishepard\/pydriller: Python Framework to analyse Git repositories. https:\/\/github.com\/ishepard\/pydriller.  ishepard\/pydriller: Python Framework to analyse Git repositories. https:\/\/github.com\/ishepard\/pydriller.","key":"e_1_3_2_1_4_1"},{"unstructured":"JGit | The Eclipse Foundation. https:\/\/www.eclipse.org\/jgit\/.  JGit | The Eclipse Foundation. https:\/\/www.eclipse.org\/jgit\/.","key":"e_1_3_2_1_5_1"},{"unstructured":"mauricioaniche\/repodriller: a tool to support researchers on mining software repositories studies.  mauricioaniche\/repodriller: a tool to support researchers on mining software repositories studies.","key":"e_1_3_2_1_6_1"},{"unstructured":"Neo4j Graph Platform-The Leader in Graph Databases. https:\/\/github.com\/neo4j\/neo4j.  Neo4j Graph Platform-The Leader in Graph Databases. https:\/\/github.com\/neo4j\/neo4j.","key":"e_1_3_2_1_7_1"},{"key":"e_1_3_2_1_8_1","volume-title":"Java code metrics calculator (ck )","author":"Aniche M.","year":"2015","unstructured":"M. Aniche . Java code metrics calculator (ck ) , 2015 . Available in https:\/\/github.com\/mauricioaniche\/ck\/. M. Aniche. Java code metrics calculator (ck ), 2015. Available in https:\/\/github.com\/mauricioaniche\/ck\/."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_9_1","DOI":"10.1145\/3305160.3305173"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_10_1","DOI":"10.1145\/1327452.1327492"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_11_1","DOI":"10.1109\/MSR.2019.00070"},{"key":"e_1_3_2_1_12_1","volume-title":"The GHTorent dataset and tool suite The GHTorent Dataset and Tool Suite. (June)","author":"Gousios G.","year":"2015","unstructured":"G. Gousios . The GHTorent dataset and tool suite The GHTorent Dataset and Tool Suite. (June) , 2015 . G. Gousios. The GHTorent dataset and tool suite The GHTorent Dataset and Tool Suite. (June), 2015."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_13_1","DOI":"10.5555\/2664446.2664449"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_14_1","DOI":"10.1145\/1773912.1773922"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_15_1","DOI":"10.1145\/3196398.3196464"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_16_1","DOI":"10.1109\/MSR.2010.5463348"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_17_1","DOI":"10.1109\/MSST.2010.5496972"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_18_1","DOI":"10.1145\/3236024.3264598"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_19_1","DOI":"10.1145\/3180155.3180206"}],"event":{"sponsor":["SIGSOFT ACM Special Interest Group on Software Engineering"],"acronym":"ESEC\/FSE '20","name":"ESEC\/FSE '20: 28th ACM Joint European Software Engineering Conference and Symposium on the Foundations of Software Engineering","location":"Virtual USA"},"container-title":["Proceedings of the 4th ACM SIGSOFT International Workshop on Machine-Learning Techniques for Software-Quality Evaluation"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3416505.3423562","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3416505.3423562","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T22:01:21Z","timestamp":1750197681000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3416505.3423562"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,11,13]]},"references-count":19,"alternative-id":["10.1145\/3416505.3423562","10.1145\/3416505"],"URL":"https:\/\/doi.org\/10.1145\/3416505.3423562","relation":{},"subject":[],"published":{"date-parts":[[2020,11,13]]},"assertion":[{"value":"2020-11-13","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}