{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,26]],"date-time":"2025-03-26T07:37:35Z","timestamp":1742974655446,"version":"3.40.3"},"publisher-location":"Cham","reference-count":34,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031610561"},{"type":"electronic","value":"9783031610578"}],"license":[{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024]]},"DOI":"10.1007\/978-3-031-61057-8_17","type":"book-chapter","created":{"date-parts":[[2024,6,2]],"date-time":"2024-06-02T20:17:29Z","timestamp":1717359449000},"page":"284-299","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Improving Understandability and\u00a0Control in\u00a0Data Preparation: A Human-Centered Approach"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2808-5619","authenticated-orcid":false,"given":"Emanuele","family":"Pucci","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3820-7870","authenticated-orcid":false,"given":"Camilla","family":"Sancricca","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9804-4009","authenticated-orcid":false,"given":"Salvatore","family":"Andolina","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6062-5174","authenticated-orcid":false,"given":"Cinzia","family":"Cappiello","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0552-8624","authenticated-orcid":false,"given":"Maristella","family":"Matera","sequence":"additional","affiliation":[]},{"given":"Anna","family":"Barberio","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,6,3]]},"reference":[{"key":"17_CR1","unstructured":"Aguilar, L., Dao, D., Gan, S., Gurel, et al.: Ease. ML: a lifecycle management system for MLDev and MLOps. In: Proceedings of Innovative Data Systems Research (2021)"},{"key":"17_CR2","unstructured":"Berti-\u00c9quille, L.: Active reinforcement learning for data preparation: Learn2Clean with human-in-the-loop. In: Proceedings of CIDR 2020 (2020). www.cidrdb.org"},{"key":"17_CR3","unstructured":"Berti-\u00c9quille, L., Comignani, U.: Explaining automated data cleaning with CleanEX. In: Proceedings of XAI 2021 (2021)"},{"issue":"4","key":"17_CR4","doi-asserted-by":"publisher","first-page":"493","DOI":"10.1007\/s00766-020-00333-1","volume":"25","author":"L Chazette","year":"2020","unstructured":"Chazette, L., Schneider, K.: Explainability as a non-functional requirement: challenges and recommendations. Requirements Eng. 25(4), 493\u2013514 (2020)","journal-title":"Requirements Eng."},{"key":"17_CR5","doi-asserted-by":"crossref","unstructured":"Chu, X., et al.: KATARA: a data cleaning system powered by knowledge bases and crowdsourcing. In: Sellis, T.K., Davidson, S.B., Ives, Z.G. (eds.) Proceedings of SIGMOD 2015, pp. 1247\u20131261. ACM (2015)","DOI":"10.1145\/2723372.2749431"},{"key":"17_CR6","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1007\/978-3-030-57321-8_18","volume-title":"Machine Learning and Knowledge Extraction","author":"D Cirqueira","year":"2020","unstructured":"Cirqueira, D., Nedbal, D., Helfert, M., Bezbradica, M.: Scenario-based requirements elicitation for user-centric explainable AI. In: Holzinger, A., Kieseberg, P., Tjoa, A.M., Weippl, E. (eds.) CD-MAKE 2020. LNCS, vol. 12279, pp. 321\u2013341. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-57321-8_18"},{"key":"17_CR7","doi-asserted-by":"publisher","first-page":"106180","DOI":"10.1016\/j.asoc.2020.106180","volume":"90","author":"DC Corrales","year":"2020","unstructured":"Corrales, D.C., Ledezma, A., Corrales, J.C.: A case-based reasoning system for recommendation of data cleaning algorithms in classification and regression tasks. Appl. Soft Comput. 90, 106180 (2020)","journal-title":"Appl. Soft Comput."},{"key":"17_CR8","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"165","DOI":"10.1007\/978-3-031-20627-6_16","volume-title":"Health Information Science","author":"Q Cui","year":"2022","unstructured":"Cui, Q., et al.: HoloCleanX: a multi-source heterogeneous data cleaning solution based on lakehouse. In: Traina, A., Wang, H., Zhang, Y., Siuly, S., Zhou, R., Chen, L. (eds.) HIS 2022. LNCS, vol. 13705, pp. 165\u2013176. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-20627-6_16"},{"key":"17_CR9","doi-asserted-by":"publisher","first-page":"113","DOI":"10.1007\/978-3-319-61073-3_5","volume-title":"Requirements Engineering","author":"J Dick","year":"2017","unstructured":"Dick, J., Hull, E., Jackson, K.: Requirements engineering in the problem domain. In: Dick, J., Hull, E., Jackson, K. (eds.) Requirements Engineering, pp. 113\u2013134. Springer, Cham (2017). https:\/\/doi.org\/10.1007\/978-3-319-61073-3_5"},{"key":"17_CR10","doi-asserted-by":"crossref","unstructured":"Eiband, M., Schneider, H., Bilandzic, M., Fazekas-Con, J., Haug, M., Hussmann, H.: Bringing transparency design into practice. In: Proceedings of IUI 2018, pp. 211\u2013223 (2018)","DOI":"10.1145\/3172944.3172961"},{"issue":"3","key":"17_CR11","doi-asserted-by":"publisher","first-page":"391","DOI":"10.1080\/10447318.2022.2153320","volume":"39","author":"OO Garibay","year":"2023","unstructured":"Garibay, O.O., et al.: Six human-centered artificial intelligence grand challenges. Int. J. Hum.-Comput. Interact. 39(3), 391\u2013437 (2023). https:\/\/doi.org\/10.1080\/10447318.2022.2153320","journal-title":"Int. J. Hum.-Comput. Interact."},{"key":"17_CR12","unstructured":"Gupta, N., et al.: Data quality toolkit: Automatic assessment of data quality and remediation for machine learning datasets. CoRR abs\/2108.05935 (2021)"},{"key":"17_CR13","unstructured":"Hall, M., et al.: A systematic method to understand requirements for explainable AI (XAI) systems. In: Proceedings of XAI 2019, Macau, China (2019)"},{"issue":"6","key":"17_CR14","doi-asserted-by":"publisher","first-page":"1844","DOI":"10.1073\/pnas.1807184115","volume":"116","author":"J Heer","year":"2019","unstructured":"Heer, J.: Agency plus automation: designing artificial intelligence into interactive systems. Proc. Natl. Acad. Sci. 116(6), 1844\u20131850 (2019)","journal-title":"Proc. Natl. Acad. Sci."},{"key":"17_CR15","doi-asserted-by":"crossref","unstructured":"Issa, O., Bonifati, A., Toumani, F.: INCA: inconsistency-aware data profiling and querying. In: Proceedings of SIGMOD 2021, pp. 2745\u20132749 (2021)","DOI":"10.1145\/3448016.3452760"},{"issue":"2","key":"17_CR16","first-page":"90","volume":"9","author":"Y Kim","year":"2020","unstructured":"Kim, Y., Lee, K., Oh, U.: Understanding interactive and explainable feedback for supporting non-experts with data preparation for building a deep learning model. Int. J. Adv. Smart Convergence 9(2), 90\u2013104 (2020)","journal-title":"Int. J. Adv. Smart Convergence"},{"key":"17_CR17","doi-asserted-by":"crossref","unstructured":"Liao, Q.V., Gruen, D., Miller, S.: Questioning the AI: informing design practices for explainable AI user experiences. In: Proceedings of CHI 2020, pp. 1\u201315 (2020)","DOI":"10.1145\/3313831.3376590"},{"key":"17_CR18","doi-asserted-by":"crossref","unstructured":"Luo, Y., Chai, C., Qin, X., Tang, N., Li, G.: Interactive cleaning for progressive visualization through composite questions. In: Proceedings of ICDE 2020, pp. 733\u2013744 (2020)","DOI":"10.1109\/ICDE48307.2020.00069"},{"key":"17_CR19","doi-asserted-by":"publisher","unstructured":"MacNeil, S., Tran, A., Mogil, D., Bernstein, S., Ross, E., Huang, Z.: Generating diverse code explanations using the GPT-3 large language model. In: Vahrenhold, J., Fisler, K., Hauswirth, M., Franklin, D. (eds.) ICER 2022: ACM Conference on International Computing Education Research, Lugano and Virtual Event Switzerland, 7\u201311 August 2022, vol. 2, pp. 37\u201339. ACM (2022). https:\/\/doi.org\/10.1145\/3501709.3544280","DOI":"10.1145\/3501709.3544280"},{"key":"17_CR20","unstructured":"Mahdavi, M., Abedjan, Z.: Semi-supervised data cleaning with Raha and Baran. In: 11th Conference on Innovative Data Systems Research, CIDR 2021, Virtual Event, 11\u201315 January 2021, Online Proceedings (2021). www.cidrdb.org"},{"key":"17_CR21","series-title":"Lecture Notes in Business Information Processing","doi-asserted-by":"publisher","first-page":"532","DOI":"10.1007\/978-3-030-37453-2_43","volume-title":"Business Process Management Workshops","author":"N Martin","year":"2019","unstructured":"Martin, N., Martinez-Millana, A., Valdivieso, B., Fern\u00e1ndez-Llatas, C.: Interactive data cleaning for process mining: a case study of an outpatient clinic\u2019s appointment system. In: Di Francescomarino, C., Dijkman, R., Zdun, U. (eds.) BPM 2019. LNBIP, vol. 362, pp. 532\u2013544. Springer, Cham (2019). https:\/\/doi.org\/10.1007\/978-3-030-37453-2_43"},{"key":"17_CR22","unstructured":"McGregor, S., Paeth, K., Lam, K.: Indexing AI risks with incidents, issues, and variants. arXiv preprint arXiv:2211.10384 (2022)"},{"key":"17_CR23","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.artint.2018.07.007","volume":"267","author":"T Miller","year":"2019","unstructured":"Miller, T.: Explanation in artificial intelligence: insights from the social sciences. Artif. Intell. 267, 1\u201338 (2019)","journal-title":"Artif. Intell."},{"issue":"12","key":"17_CR24","doi-asserted-by":"publisher","first-page":"1860","DOI":"10.14778\/2824032.2824086","volume":"8","author":"T Papenbrock","year":"2015","unstructured":"Papenbrock, T., Bergmann, T., Finke, M., Zwiener, J., Naumann, F.: Data profiling with metanome. Proc. VLDB Endow. 8(12), 1860\u20131863 (2015)","journal-title":"Proc. VLDB Endow."},{"key":"17_CR25","doi-asserted-by":"crossref","unstructured":"Parulian, N.N., Lud\u00e4scher, B.: DCM explorer: a tool to support transparent data cleaning through provenance exploration. In: Proceedings of Theory and Practice of Provenance 2022, pp.\u00a01\u20136 (2022)","DOI":"10.1145\/3530800.3534539"},{"key":"17_CR26","doi-asserted-by":"crossref","unstructured":"Ribeiro, M.T., Singh, S., Guestrin, C.: \u201cWhy should i trust you?\": explaining the predictions of any classifier. In: Proceedings of KDD 2016, KDD 2016, pp. 1135\u20131144. ACM (2016)","DOI":"10.18653\/v1\/N16-3020"},{"key":"17_CR27","doi-asserted-by":"crossref","unstructured":"Rosson, M.B., Carroll, J.M.: Scenario-based design. In: The Human-Computer Interaction Handbook, pp. 1067\u20131086. CRC Press (2007)","DOI":"10.1201\/9781410615862-67"},{"key":"17_CR28","unstructured":"Sancricca, C., Cappiello, C.: Supporting the design of data preparation pipelines. In: Proceedings of the SEBD 2022. CEUR Workshop Proceedings, vol.\u00a03194, pp. 149\u2013158. CEUR-WS.org (2022)"},{"key":"17_CR29","doi-asserted-by":"publisher","unstructured":"Sarsa, S., Denny, P., Hellas, A., Leinonen, J.: Automatic generation of programming exercises and code explanations using large language models. In: Vahrenhold, J., Fisler, K., Hauswirth, M., Franklin, D. (eds.) ICER 2022: ACM Conference on International Computing Education Research, Lugano and Virtual Event, Switzerland, 7\u201311 August 2022, vol. 1, pp. 27\u201343. ACM (2022). https:\/\/doi.org\/10.1145\/3501385.3543957","DOI":"10.1145\/3501385.3543957"},{"key":"17_CR30","unstructured":"Shimizu, T., Omori, H., Yoshikawa, M.: Toward a view-based data cleaning architecture. arXiv preprint arXiv:1910.11040 (2019)"},{"key":"17_CR31","doi-asserted-by":"publisher","first-page":"89","DOI":"10.1016\/j.inffus.2021.05.009","volume":"76","author":"G Vilone","year":"2021","unstructured":"Vilone, G., Longo, L.: Notions of explainability and evaluation approaches for explainable artificial intelligence. Inf. Fusion 76, 89\u2013106 (2021)","journal-title":"Inf. Fusion"},{"issue":"4","key":"17_CR32","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1080\/07421222.1996.11518099","volume":"12","author":"RY Wang","year":"1996","unstructured":"Wang, R.Y., Strong, D.M.: Beyond accuracy: what data quality means to data consumers. J. Manag. Inf. Syst. 12(4), 5\u201333 (1996)","journal-title":"J. Manag. Inf. Syst."},{"key":"17_CR33","doi-asserted-by":"crossref","unstructured":"Wolf, C.T.: Explainability scenarios: towards scenario-based XAI design. In: Proceedings of IUI 2019, pp. 252\u2013257 (2019)","DOI":"10.1145\/3301275.3302317"},{"key":"17_CR34","doi-asserted-by":"crossref","unstructured":"Yan, C., He, Y.: Auto-suggest: learning-to-recommend data preparation steps using data science notebooks. In: Proceedings of SIGMOD 2020, pp. 1539\u20131554 (2020)","DOI":"10.1145\/3318464.3389738"}],"container-title":["Lecture Notes in Computer Science","Advanced Information Systems Engineering"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-61057-8_17","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,6,2]],"date-time":"2024-06-02T20:19:44Z","timestamp":1717359584000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-61057-8_17"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"ISBN":["9783031610561","9783031610578"],"references-count":34,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-61057-8_17","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2024]]},"assertion":[{"value":"3 June 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"CAiSE","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Advanced Information Systems Engineering","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Limassol","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Cyprus","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"3 June 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"7 June 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"36","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"caise2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/cyprusconferences.org\/caise2024\/#","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}