{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,29]],"date-time":"2024-10-29T11:11:33Z","timestamp":1730200293188,"version":"3.28.0"},"reference-count":27,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,12,15]],"date-time":"2023-12-15T00:00:00Z","timestamp":1702598400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,12,15]],"date-time":"2023-12-15T00:00:00Z","timestamp":1702598400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,12,15]]},"DOI":"10.1109\/bigdata59044.2023.10386531","type":"proceedings-article","created":{"date-parts":[[2024,1,22]],"date-time":"2024-01-22T18:28:47Z","timestamp":1705948127000},"page":"1581-1590","source":"Crossref","is-referenced-by-count":0,"title":["Refactoring ETL Flows in The Wild"],"prefix":"10.1109","author":[{"given":"Dolev","family":"Adas","sequence":"first","affiliation":[{"name":"IBM Research,Israel"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ohad","family":"Eytan","sequence":"additional","affiliation":[{"name":"IBM Research,Israel"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Guy","family":"Khazma","sequence":"additional","affiliation":[{"name":"University of Toronto at Ontario,Department of Computer Science,Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Josep","family":"Samp\u00e9","sequence":"additional","affiliation":[{"name":"IBM Research,Israel"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Paula","family":"Ta-Shma","sequence":"additional","affiliation":[{"name":"IBM Research,Israel"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"volume-title":"The History, Present, and Future of ETL Technology","year":"2023","author":"Simitsis","key":"ref1"},{"volume-title":"Global ETL Software Market Insights","key":"ref2"},{"volume-title":"IBM DataStage\u2122","key":"ref3"},{"volume-title":"DAG (DBT Documentation)","key":"ref4"},{"volume-title":"DAGs (Airflow Documentation)","key":"ref5"},{"volume-title":"DAG (DVC Documentation","key":"ref6"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICDM.2002.1184038"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1145\/1651291.1651297"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1016\/j.datak.2017.08.004"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2004.33"},{"key":"ref11","article-title":"An improved algorithm for matching large graphs","volume-title":"Proc. of the 3rd IAPR-TC-15 International Workshop on Graph-based Representations","volume":"57","author":"Sansone"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.14778\/2733004.2733009"},{"volume-title":"Technical notes on extending gSpan to directed graphs","year":"2010","author":"Leung","key":"ref13"},{"volume-title":"betterenvi\/gSpan: a Python implementation of gSpan","author":"Chen","key":"ref14"},{"volume-title":"TonyZZX\/gSpan.Java: a Java implementation of gSpan","author":"Zhu","key":"ref15"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/BigData52589.2021.9671995"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/1368088.1368172"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1145\/1808901.1808909"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1007\/s11219-015-9296-0"},{"volume-title":"IBM Subflows in DataStage","key":"ref20"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1017\/s0269888912000331"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1155\/2014\/869198"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/3381449"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1007\/s10796-020-09995-2"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/SP.1980.10006"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1145\/956750.956784"},{"volume-title":"Releasing Anonymized ETL Flow Datasets for FSM","year":"2023","author":"Eytan","key":"ref27"}],"event":{"name":"2023 IEEE International Conference on Big Data (BigData)","start":{"date-parts":[[2023,12,15]]},"location":"Sorrento, Italy","end":{"date-parts":[[2023,12,18]]}},"container-title":["2023 IEEE International Conference on Big Data (BigData)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10385234\/10386078\/10386531.pdf?arnumber=10386531","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,2,1]],"date-time":"2024-02-01T02:12:00Z","timestamp":1706753520000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10386531\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,12,15]]},"references-count":27,"URL":"https:\/\/doi.org\/10.1109\/bigdata59044.2023.10386531","relation":{},"subject":[],"published":{"date-parts":[[2023,12,15]]}}}