{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,22]],"date-time":"2026-03-22T06:10:44Z","timestamp":1774159844323,"version":"3.50.1"},"publisher-location":"Cham","reference-count":45,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783319929002","type":"print"},{"value":"9783319929019","type":"electronic"}],"license":[{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018]]},"DOI":"10.1007\/978-3-319-92901-9_3","type":"book-chapter","created":{"date-parts":[[2018,6,6]],"date-time":"2018-06-06T06:27:41Z","timestamp":1528266461000},"page":"24-38","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":16,"title":["CrowdCorrect: A Curation Pipeline for Social Data Cleansing and Curation"],"prefix":"10.1007","author":[{"given":"Amin","family":"Beheshti","sequence":"first","affiliation":[]},{"given":"Kushal","family":"Vaghani","sequence":"additional","affiliation":[]},{"given":"Boualem","family":"Benatallah","sequence":"additional","affiliation":[]},{"given":"Alireza","family":"Tabebordbar","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,6,7]]},"reference":[{"key":"3_CR1","first-page":"308","volume":"240","author":"WD Abilhoa","year":"2014","unstructured":"Abilhoa, W.D., De Castro, L.N.: A keyword extraction method from Twitter messages represented as graphs. Appl. Math. Comput. 240, 308\u2013325 (2014)","journal-title":"Appl. Math. Comput."},{"key":"3_CR2","doi-asserted-by":"crossref","unstructured":"Abu-Salih, B., Wongthongtham, P., Beheshti, S., Zhu, D.: A preliminary approach to domain-based evaluation of users\u2019 trustworthiness in online social networks. In: 2015 IEEE International Congress on Big Data, New York City, NY, USA, 27 June\u20132 July 2015, pp. 460\u2013466 (2015)","DOI":"10.1109\/BigDataCongress.2015.74"},{"key":"3_CR3","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/978-1-4419-8462-3","volume-title":"Social Network Data Analytics","author":"Charu C. Aggarwal","year":"2011","unstructured":"Aggarwal, C.C.: An introduction to social network data analytics. In: Social Network Data Analytics, pp. 1\u201315 (2011)"},{"key":"3_CR4","unstructured":"Anderson, M., et al.: Brainwash: a data system for feature engineering. In: CIDR (2013)"},{"issue":"12","key":"3_CR5","doi-asserted-by":"publisher","first-page":"2521","DOI":"10.1002\/asi.22768","volume":"63","author":"Y Bae","year":"2012","unstructured":"Bae, Y., Lee, H.: Sentiment analysis of Twitter audiences: measuring the positive or negative influence of popular Twitterers. J. Assoc. Inf. Sci. Technol. 63(12), 2521\u20132535 (2012)","journal-title":"J. Assoc. Inf. Sci. Technol."},{"issue":"3","key":"3_CR6","doi-asserted-by":"publisher","first-page":"1189","DOI":"10.1007\/s10586-015-0472-6","volume":"18","author":"O Batarfi","year":"2015","unstructured":"Batarfi, O., Shawi, R.E., Fayoumi, A.G., Nouri, R., Beheshti, S., Barnawi, A., Sakr, S.: Large scale graph processing systems: survey and an experimental evaluation. Cluster Comput. 18(3), 1189\u20131213 (2015)","journal-title":"Cluster Comput."},{"issue":"4","key":"3_CR7","doi-asserted-by":"publisher","first-page":"842","DOI":"10.1002\/spe.2558","volume":"48","author":"A Beheshti","year":"2018","unstructured":"Beheshti, A., Benatallah, B., Motahari-Nezhad, H.R.: ProcessAtlas: a scalable and extensible platform for business process analytics. Softw. Pract. Exp. 48(4), 842\u2013866 (2018)","journal-title":"Softw. Pract. Exp."},{"key":"3_CR8","doi-asserted-by":"crossref","unstructured":"Beheshti, A., Benatallah, B., Nouri, R., Chhieng, V.M., Xiong, H., Zhao, X.: Coredb: a data lake service. In: Proceedings of the 2017 ACM on Conference on Information and Knowledge Management, CIKM 2017, Singapore, 06\u201310 November 2017, pp. 2451\u20132454 (2017)","DOI":"10.1145\/3132847.3133171"},{"key":"3_CR9","unstructured":"Beheshti, S., Benatallah, B., Motahari-Nezhad, H.R.: Galaxy: a platform for explorative analysis of open data sources. In: Proceedings of the 19th International Conference on Extending Database Technology, EDBT 2016, Bordeaux, France, 15\u201316 March 2016, pp. 640\u2013643 (2016)"},{"issue":"3","key":"3_CR10","doi-asserted-by":"publisher","first-page":"379","DOI":"10.1007\/s10619-014-7171-9","volume":"34","author":"S Beheshti","year":"2016","unstructured":"Beheshti, S., Benatallah, B., Motahari-Nezhad, H.R.: Scalable graph-based OLAP analytics over process execution data. Distrib. Parallel Databases 34(3), 379\u2013423 (2016)","journal-title":"Distrib. Parallel Databases"},{"key":"3_CR11","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-25037-3","volume-title":"Process Analytics - Concepts and Techniques for Querying and Analyzing Process Data","author":"S-M-R Beheshti","year":"2016","unstructured":"Beheshti, S.-M.-R., Benatallah, B., Sakr, S., Grigori, D., Motahari-Nezhad, H.R., Barukh, M.C., Gater, A., Ryu, S.H.: Process Analytics - Concepts and Techniques for Querying and Analyzing Process Data. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-25037-3"},{"issue":"4","key":"3_CR12","doi-asserted-by":"publisher","first-page":"313","DOI":"10.1007\/s00607-016-0490-0","volume":"99","author":"S Beheshti","year":"2017","unstructured":"Beheshti, S., Benatallah, B., Venugopal, S., Ryu, S.H., Motahari-Nezhad, H.R., Wang, W.: A systematic review and comparative analysis of cross-document coreference resolution methods and tools. Computing 99(4), 313\u2013349 (2017)","journal-title":"Computing"},{"key":"3_CR13","doi-asserted-by":"publisher","unstructured":"Beheshti, S., Tabebordbar, A., Benatallah, B., Nouri, R.: On automating basic data curation tasks. In: Proceedings of the 26th International Conference on World Wide Web Companion, Perth, Australia, 3\u20137 April 2017, pp. 165\u2013169 (2017). https:\/\/doi.org\/10.1145\/3041021.3054726","DOI":"10.1145\/3041021.3054726"},{"key":"3_CR14","unstructured":"Beheshti, S., Venugopal, S., Ryu, S.H., Benatallah, B., Wang, W.: Big data and cross-document coreference resolution: current state and future opportunities. CoRR abs\/1311.3987 (2013)"},{"key":"3_CR15","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1007\/978-3-319-25037-3_5","volume-title":"Process Analytics","author":"S Beheshti","year":"2016","unstructured":"Beheshti, S., et al.: Business process data analysis. In: Beheshti, S., et al. (eds.) Process Analytics, pp. 107\u2013134. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-25037-3_5"},{"key":"3_CR16","doi-asserted-by":"crossref","unstructured":"Brigadir, I., Greene, D., Cunningham, P.: A system for Twitter user list curation. In: Proceedings of the Sixth ACM Conference on Recommender Systems, pp. 293\u2013294. ACM (2012)","DOI":"10.1145\/2365952.2366019"},{"issue":"10\u201317","key":"3_CR17","first-page":"30","volume":"10","author":"M Cha","year":"2010","unstructured":"Cha, M., Haddadi, H., Benevenuto, F., Gummadi, P.K.: Measuring user influence in Twitter: the million follower fallacy. ICWSM 10(10\u201317), 30 (2010)","journal-title":"ICWSM"},{"issue":"3","key":"3_CR18","first-page":"4","volume":"36","author":"X Chai","year":"2013","unstructured":"Chai, X., et al.: Social media analytics: the Kosmix story. IEEE Data Eng. Bull. 36(3), 4\u201312 (2013)","journal-title":"IEEE Data Eng. Bull."},{"key":"3_CR19","doi-asserted-by":"crossref","unstructured":"Chitrakala, S.: Twitter data analysis. In: Modern Technologies for Big Data Classification and Clustering, p. 124 (2017)","DOI":"10.4018\/978-1-5225-2805-0.ch005"},{"key":"3_CR20","unstructured":"Duh, K., Hirao, T., Kimura, A., Ishiguro, K., Iwata, T., Yeung, C.M.A.: Creating stories: social curation of Twitter messages. In: ICWSM (2012)"},{"key":"3_CR21","unstructured":"Ginn, R., Pimpalkhute, P., Nikfarjam, A., Patki, A., OConnor, K., Sarker, A., Smith, K., Gonzalez, G.: Mining Twitter for adverse drug reaction mentions: a corpus and classification benchmark. In: Proceedings of the Fourth Workshop on Building and Evaluating Resources for Health and Biomedical Text Processing (2014)"},{"key":"3_CR22","doi-asserted-by":"crossref","unstructured":"Godin, F., Slavkovikj, V., De Neve, W., Schrauwen, B., Van de Walle, R.: Using topic models for Twitter hashtag recommendation. In: Proceedings of the 22nd International Conference on World Wide Web, pp. 593\u2013596. ACM (2013)","DOI":"10.1145\/2487788.2488002"},{"issue":"1","key":"3_CR23","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1145\/2674026.2674029","volume":"16","author":"O Goonetilleke","year":"2014","unstructured":"Goonetilleke, O., Sellis, T., Zhang, X., Sathe, S.: Twitter analytics: a big data management perspective. SIGKDD Explor. Newsl. 16(1), 11\u201320 (2014). https:\/\/doi.org\/10.1145\/2674026.2674029","journal-title":"SIGKDD Explor. Newsl."},{"issue":"6","key":"3_CR24","first-page":"1","volume":"14","author":"J Howe","year":"2006","unstructured":"Howe, J.: The rise of crowdsourcing. Wired Mag. 14(6), 1\u20134 (2006)","journal-title":"Wired Mag."},{"key":"3_CR25","doi-asserted-by":"crossref","unstructured":"Kim, N.W., et al.: BudgetMap: engaging taxpayers in the issue-driven classification of a government budget. In: CSCW, pp. 1026\u20131037 (2016)","DOI":"10.1145\/2818048.2820004"},{"key":"3_CR26","doi-asserted-by":"crossref","unstructured":"Kittur, A., Nickerson, J.V., Bernstein, M., Gerber, E., Shaw, A., Zimmerman, J., Lease, M., Horton, J.: The future of crowd work. In: CSCW (2013)","DOI":"10.1145\/2441776.2441923"},{"issue":"56","key":"3_CR27","doi-asserted-by":"publisher","first-page":"34","DOI":"10.1002\/rwm3.20324","volume":"2016","author":"E Kooge","year":"2016","unstructured":"Kooge, E., et al.: Merging data streams. Res. World 2016(56), 34\u201337 (2016)","journal-title":"Res. World"},{"issue":"Suppl 1","key":"3_CR28","doi-asserted-by":"publisher","first-page":"i200","DOI":"10.1093\/bioinformatics\/bth919","volume":"20","author":"M. Koyuturk","year":"2004","unstructured":"Koyut\u00fcrk, M., Grama, A., Szpankowski, W.: An efficient algorithm for detecting frequent subgraphs in biological networks. Bioinformatics 20(Suppl_1), i200\u2013i207 (2004)","journal-title":"Bioinformatics"},{"key":"3_CR29","doi-asserted-by":"crossref","unstructured":"Krishnan, S., et al.: Towards reliable interactive data cleaning: a user survey and recommendations. In: HILDA@ SIGMOD, p. 9 (2016)","DOI":"10.1145\/2939502.2939511"},{"key":"3_CR30","doi-asserted-by":"crossref","unstructured":"Kwak, H., Lee, C., Park, H., Moon, S.: What is Twitter, a social network or a news media? In: WWW (2010)","DOI":"10.1145\/1772690.1772751"},{"key":"3_CR31","doi-asserted-by":"crossref","unstructured":"Lee, K., Palsetia, D., Narayanan, R., Patwary, M.M.A., Agrawal, A., Choudhary, A.: Twitter trending topic classification. In: 2011 IEEE 11th International Conference on Data Mining Workshops (ICDMW), pp. 251\u2013258. IEEE (2011)","DOI":"10.1109\/ICDMW.2011.171"},{"key":"3_CR32","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"88","DOI":"10.1007\/978-3-642-25953-1_8","volume-title":"The Semantic Web: ESWC 2011 Workshops","author":"D Maynard","year":"2012","unstructured":"Maynard, D., Funk, A.: Automatic detection of political opinions in tweets. In: Garc\u00eda-Castro, R., Fensel, D., Antoniou, G. (eds.) ESWC 2011. LNCS, vol. 7117, pp. 88\u201399. Springer, Heidelberg (2012). https:\/\/doi.org\/10.1007\/978-3-642-25953-1_8"},{"key":"3_CR33","doi-asserted-by":"crossref","unstructured":"Perera, R.D., Anand, S., Subbalakshmi, K., Chandramouli, R.: Twitter analytics: architecture, tools and analysis. In: Military Communications Conference, 2010-MILCOM 2010, pp. 2186\u20132191. IEEE (2010)","DOI":"10.1109\/MILCOM.2010.5680493"},{"issue":"4","key":"3_CR34","first-page":"3","volume":"23","author":"E Rahm","year":"2000","unstructured":"Rahm, E., Do, H.H.: Data cleaning: problems and current approaches. IEEE Data Eng. Bull. 23(4), 3\u201313 (2000)","journal-title":"IEEE Data Eng. Bull."},{"key":"3_CR35","unstructured":"Roberts, K., Roach, M.A., Johnson, J., Guthrie, J., Harabagiu, S.M.: EmpaTweet: annotating and detecting emotions on Twitter. In: LREC, vol. 12, pp. 3806\u20133813 (2012)"},{"issue":"6","key":"3_CR36","doi-asserted-by":"publisher","first-page":"57","DOI":"10.1145\/336460.336475","volume":"43","author":"E Rundensteiner","year":"2000","unstructured":"Rundensteiner, E., et al.: Maintaining data warehouses over changing information sources. Commun. ACM 43(6), 57\u201362 (2000)","journal-title":"Commun. ACM"},{"key":"3_CR37","unstructured":"Russom, P., et al.: Big data analytics. TDWI Best Practices Report, Fourth Quarter, pp. 1\u201335 (2011)"},{"key":"3_CR38","doi-asserted-by":"crossref","unstructured":"Sadeghi, F., et al.: VisKE: visual knowledge extraction and question answering by visual verification of relation phrases. In: CVPR, pp. 1456\u20131464. IEEE (2015)","DOI":"10.1109\/CVPR.2015.7298752"},{"key":"3_CR39","unstructured":"Salih, B.A., Wongthongtham, P., Beheshti, S.M.R., Zajabbari, B.: Towards a methodology for social business intelligence in the era of big social data incorporating trust and semantic analysis. In: Second International Conference on Advanced Data and Information Engineering (DaEng-2015). Springer, Bali (2015)"},{"issue":"2","key":"3_CR40","first-page":"443","volume":"27","author":"W Shen","year":"2015","unstructured":"Shen, W., et al.: Entity linking with a knowledge base: issues, techniques, and solutions. ITKDE 27(2), 443\u2013460 (2015)","journal-title":"ITKDE"},{"key":"3_CR41","unstructured":"Sosamphan, P., et al.: SNET: a statistical normalisation method for Twitter. Master\u2019s thesis (2016)"},{"key":"3_CR42","doi-asserted-by":"crossref","unstructured":"Sriram, B., Fuhry, D., Demir, E., Ferhatosmanoglu, H., Demirbas, M.: Short text classification in Twitter to improve information filtering. In: SIGIR. ACM (2010)","DOI":"10.1145\/1835449.1835643"},{"key":"3_CR43","doi-asserted-by":"crossref","unstructured":"Troncy, R.: Linking entities for enriching and structuring social media content. In: WWW, pp. 597\u2013597 (2016)","DOI":"10.1145\/2872518.2892109"},{"key":"3_CR44","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"216","DOI":"10.1007\/978-3-642-16567-2_16","volume-title":"Social Informatics","author":"S Ye","year":"2010","unstructured":"Ye, S., Wu, S.F.: Measuring message propagation and social influence on Twitter.com. In: Bolc, L., Makowski, M., Wierzbicki, A. (eds.) SocInfo 2010. LNCS, vol. 6430, pp. 216\u2013231. Springer, Heidelberg (2010). https:\/\/doi.org\/10.1007\/978-3-642-16567-2_16"},{"key":"3_CR45","unstructured":"Zhao, W.X., Jiang, J., He, J., Song, Y., Achananuparp, P., Lim, E.P., Li, X.: Topical keyphrase extraction from Twitter. In: Proceedings of the 49th Annual Meeting of the Association for Computational Linguistics: Human Language Technologies, vol. 1, pp. 379\u2013388. Association for Computational Linguistics (2011)"}],"container-title":["Lecture Notes in Business Information Processing","Information Systems in the Big Data Era"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-92901-9_3","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,12]],"date-time":"2024-03-12T15:24:54Z","timestamp":1710257094000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-319-92901-9_3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018]]},"ISBN":["9783319929002","9783319929019"],"references-count":45,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-92901-9_3","relation":{},"ISSN":["1865-1348","1865-1356"],"issn-type":[{"value":"1865-1348","type":"print"},{"value":"1865-1356","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018]]},"assertion":[{"value":"7 June 2018","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"CAiSE","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Advanced Information Systems Engineering","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Tallinn","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Estonia","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2018","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"11 June 2018","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"15 June 2018","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"30","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"caise2018","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/caise2018.ut.ee","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}