{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,21]],"date-time":"2025-08-21T16:27:56Z","timestamp":1755793676895,"version":"3.40.4"},"reference-count":56,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2021,11,9]],"date-time":"2021-11-09T00:00:00Z","timestamp":1636416000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2021,11,9]],"date-time":"2021-11-09T00:00:00Z","timestamp":1636416000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Data Sci Anal"],"published-print":{"date-parts":[[2022,6]]},"DOI":"10.1007\/s41060-021-00287-9","type":"journal-article","created":{"date-parts":[[2021,11,9]],"date-time":"2021-11-09T13:02:42Z","timestamp":1636462962000},"page":"65-87","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Big social data provenance framework for Zero-Information Loss Key-Value Pair (KVP) Database"],"prefix":"10.1007","volume":"14","author":[{"given":"Asma","family":"Rani","sequence":"first","affiliation":[]},{"given":"Navneet","family":"Goyal","sequence":"additional","affiliation":[]},{"given":"Shashi K.","family":"Gadia","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2021,11,9]]},"reference":[{"key":"287_CR1","doi-asserted-by":"crossref","unstructured":"Agrawal, R., Imran, A., Seay, C., Walker, J.: A layer based architecture for provenance in big data. In: 2014 IEEE International Conference on Big Data (Big Data), pp.1\u20137. IEEE (2014)","DOI":"10.1109\/BigData.2014.7004468"},{"key":"287_CR2","unstructured":"Akoush, S., Sohan, R., Hopper, A.: Hadoopprov: towards provenance as a first class citizen in mapreduce. In: Presented as Part of the 5th $$\\{$$USENIX$$\\}$$ Workshop on the Theory and Practice of Provenance (2013)"},{"key":"287_CR3","doi-asserted-by":"crossref","unstructured":"Barbier, G., Feng, Z., Gundecha, P., Liu, H.: Provenance data in social media. In: Provenance Data in Social Media (2013)","DOI":"10.1007\/978-3-031-01904-3"},{"issue":"1","key":"287_CR4","doi-asserted-by":"publisher","first-page":"76","DOI":"10.1109\/69.204093","volume":"5","author":"G Bhargava","year":"1993","unstructured":"Bhargava, G., Gadia, S.K.: Relational database systems with zero information loss. IEEE Trans. Knowl. Data Eng. 5(1), 76\u201387 (1993)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"issue":"5","key":"287_CR5","doi-asserted-by":"publisher","first-page":"66","DOI":"10.1109\/MIS.2016.86","volume":"31","author":"L Cao","year":"2016","unstructured":"Cao, L.: Data science: nature and pitfalls. IEEE Intell. Syst. 31(5), 66\u201375 (2016)","journal-title":"IEEE Intell. Syst."},{"issue":"3","key":"287_CR6","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3076253","volume":"50","author":"L Cao","year":"2017","unstructured":"Cao, L.: Data science: a comprehensive overview. ACM Comput. Surv. (CSUR) 50(3), 1\u201342 (2017)","journal-title":"ACM Comput. Surv. (CSUR)"},{"key":"287_CR7","doi-asserted-by":"crossref","unstructured":"Chacko, A., Kumar, S.M.: Big data provenance research directions. In: TENCON 2017-2017 IEEE Region 10 Conference, pp. 651\u2013656. IEEE (2017)","DOI":"10.1109\/TENCON.2017.8227942"},{"issue":"2","key":"287_CR8","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/1365815.1365816","volume":"26","author":"F Chang","year":"2008","unstructured":"Chang, F., Dean, J., Ghemawat, S., Hsieh, W.C., Wallach, D.A., Burrows, M., Chandra, T., Fikes, A., Gruber, R.E.: Bigtable: a distributed storage system for structured data. ACM Trans. Comput. Syst. (TOCS) 26(2), 1\u201326 (2008)","journal-title":"ACM Trans. Comput. Syst. (TOCS)"},{"key":"287_CR9","doi-asserted-by":"crossref","unstructured":"Che, D., Safran, M., Peng, Z.: From big data to big data mining: challenges, issues, and opportunities. In: International Conference on Database Systems for Advanced Applications, pp. 1\u201315. Springer (2013)","DOI":"10.1007\/978-3-642-40270-8_1"},{"key":"287_CR10","doi-asserted-by":"crossref","unstructured":"Cheah, Y.W., Canon, R., Plale, B., Ramakrishnan, L.: Milieu: lightweight and configurable big data provenance for science. In: 2013 IEEE International Congress on Big Data, pp. 46\u201353. IEEE (2013)","DOI":"10.1109\/BigData.Congress.2013.16"},{"key":"287_CR11","doi-asserted-by":"crossref","unstructured":"Chebotko, A., Kashlev, A., Lu, S.: A big data modeling methodology for apache cassandra. In: 2015 IEEE International Congress on Big Data, pp. 238\u2013245. IEEE (2015)","DOI":"10.1109\/BigDataCongress.2015.41"},{"key":"287_CR12","doi-asserted-by":"crossref","unstructured":"Corsar, D., Markovic, M., Edwards, P.: Social media data in research: provenance challenges. In: International Provenance and Annotation Workshop, pp. 195\u2013198. Springer (2016)","DOI":"10.1007\/978-3-319-40593-3_20"},{"key":"287_CR13","doi-asserted-by":"crossref","unstructured":"Crawl, D., Wang, J., Altintas, I.: Provenance for mapreduce-based data-intensive workflows. In: Proceedings of the 6th Workshop on Workflows in Support of Large-scale Science, pp. 21\u201330 (2011)","DOI":"10.1145\/2110497.2110501"},{"key":"287_CR14","doi-asserted-by":"crossref","unstructured":"Cuzzocrea, A.: Provenance research issues and challenges in the big data era. In: 2015 IEEE 39th Annual Computer Software and Applications Conference, vol.\u00a03, pp. 684\u2013686. IEEE (2015)","DOI":"10.1109\/COMPSAC.2015.345"},{"key":"287_CR15","unstructured":"Cuzzocrea, A.M.: Big data provenance: State-of-the-art analysis and emerging research challenges. In: Workshops of the EDBT\/ICDT 2016 Joint Conference, EDBT\/ICDT 2016, CEUR-WS, vol. 1558 (2016)"},{"key":"287_CR16","doi-asserted-by":"crossref","unstructured":"De\u00a0Nies, T., Taxidou, I., Dimou, A., Verborgh, R., Fischer, P.M., Mannens, E., Van\u00a0de, Walle, R.: Towards multi-level provenance reconstruction of information diffusion on social media. In: Proceedings of the 24th ACM International on Conference on Information and Knowledge Management, pp. 1823\u20131826 (2015)","DOI":"10.1145\/2806416.2806642"},{"key":"287_CR17","doi-asserted-by":"crossref","unstructured":"DeCandia, G., Hastorun, D., Jampani, M., Kakulapati, G., Lakshman, A., Pilchin, A., Sivasubramanian, S., Vosshall, P., Vogels, W.: Dynamo: Amazon\u2019s highly available key-value store. ACM SIGOPS Oper. Syst. Rev. 41(6), 205\u2013220 (2007)","DOI":"10.1145\/1323293.1294281"},{"key":"287_CR18","doi-asserted-by":"publisher","first-page":"267","DOI":"10.1016\/j.engappai.2018.04.009","volume":"72","author":"AM Fathollahi-Fard","year":"2018","unstructured":"Fathollahi-Fard, A.M., Hajiaghaei-Keshteli, M., Tavakkoli-Moghaddam, R.: The social engineering optimizer (seo). Eng. Appl. Artif. Intell. 72, 267\u2013293 (2018)","journal-title":"Eng. Appl. Artif. Intell."},{"key":"287_CR19","doi-asserted-by":"publisher","first-page":"106103","DOI":"10.1016\/j.cie.2019.106103","volume":"137","author":"AM Fathollahi-Fard","year":"2019","unstructured":"Fathollahi-Fard, A.M., Ranjbar-Bourani, M., Cheikhrouhou, N., Hajiaghaei-Keshteli, M.: Novel modifications of social engineering optimizer to solve a truck scheduling problem in a cross-docking system. Comput. Ind. Eng. 137, 106103 (2019)","journal-title":"Comput. Ind. Eng."},{"key":"287_CR20","unstructured":"Featherston, D.: Cassandra: Principles and Application. Department of Computer Science University of Illinois at Urbana-champaign (2010)"},{"key":"287_CR21","first-page":"2768","volume-title":"Social Provenance","author":"Z Feng","year":"2018","unstructured":"Feng, Z., Gundecha, P., Liu, H.: Social Provenance, pp. 2768\u20132772. Springer, New York (2018)"},{"key":"287_CR22","doi-asserted-by":"crossref","unstructured":"Ghoshal, D., Plale, B.: Provenance from log files: a bigdata problem. In: Proceedings of the Joint EDBT\/ICDT 2013 Workshops, pp. 290\u2013297 (2013)","DOI":"10.1145\/2457317.2457366"},{"key":"287_CR23","doi-asserted-by":"crossref","unstructured":"Glavic, B.: Big data provenance: challenges and implications for benchmarking. In: Specifying Big Data Benchmarks, pp. 72\u201380. Springer (2012)","DOI":"10.1007\/978-3-642-53974-9_7"},{"key":"287_CR24","unstructured":"Glavic, B., Miller, R.J.: Reexamining some holy grails of data provenance. TaPP 11:3rd(2011)"},{"key":"287_CR25","doi-asserted-by":"crossref","unstructured":"Gundecha, P., Feng, Z., Liu, H.: Seeking provenance of information using social media. In: Proceedings of the 22nd ACM International Conference on Information and Knowledge Management, pp. 1691\u20131696 (2013)","DOI":"10.1145\/2505515.2505633"},{"key":"287_CR26","doi-asserted-by":"publisher","first-page":"2822","DOI":"10.1016\/j.procs.2015.05.441","volume":"51","author":"R Hernandez","year":"2015","unstructured":"Hernandez, R., Becerra, Y., Torres, J., Ayguad\u00e9, E.: Automatic query driven data modelling in cassandra. Procedia Comput. Sci. 51, 2822\u20132826 (2015)","journal-title":"Procedia Comput. Sci."},{"key":"287_CR27","doi-asserted-by":"crossref","unstructured":"Hondo, F., Wercelens, P., da\u00a0Silva, W., Castro, K., Santana, I., Walter, M.E., Ara\u00fajo, A., Holanda, M., Lifschitz, S.: Data provenance management for bioinformatics workflows using nosql database systems in a cloud computing environment. In: 2017 IEEE International Conference on Bioinformatics and Biomedicine (BIBM), pp. 1929\u20131934. IEEE (2017)","DOI":"10.1109\/BIBM.2017.8217954"},{"key":"287_CR28","unstructured":"Ikeda, R., Park, H., Widom, J.: Provenance for generalized map and reduce workflows (2011)"},{"issue":"1","key":"287_CR29","doi-asserted-by":"publisher","first-page":"59","DOI":"10.1016\/j.bushor.2009.09.003","volume":"53","author":"AM Kaplan","year":"2010","unstructured":"Kaplan, A.M., Haenlein, M.: Users of the world, unite! the challenges and opportunities of social media. Bus. Horizons 53(1), 59\u201368 (2010)","journal-title":"Bus. Horizons"},{"key":"287_CR30","unstructured":"Kerchner, D., Littman, J., Peterson, C., Smallen, V., Trent, R., Wrubel, L.: The Provenance of a Tweet (2019)"},{"key":"287_CR31","doi-asserted-by":"crossref","unstructured":"Kulkarni, D.: A fine-grained access control model for key-value systems. In: Proceedings of the Third ACM Conference on Data and Application Security and Privacy, pp. 161\u2013164 (2013a)","DOI":"10.1145\/2435349.2435370"},{"key":"287_CR32","unstructured":"Kulkarni, D.: A provenance model for key-value systems. In: Presented as Part of the 5th $$\\{$$USENIX$$\\}$$ Workshop on the Theory and Practice of Provenance (2013b)"},{"issue":"2","key":"287_CR33","doi-asserted-by":"publisher","first-page":"35","DOI":"10.1145\/1773912.1773922","volume":"44","author":"A Lakshman","year":"2010","unstructured":"Lakshman, A., Malik, P.: Cassandra: a decentralized structured storage system. ACM SIGOPS Oper. Syst. Rev. 44(2), 35\u201340 (2010)","journal-title":"ACM SIGOPS Oper. Syst. Rev."},{"key":"287_CR34","unstructured":"Li, F., Zhao, Y., Felsche, K., Xu, G., Cao, L.: Coupling Analysis Between Twitter and Call Centre (2015). arXiv preprint arXiv:1509.02238"},{"key":"287_CR35","doi-asserted-by":"crossref","unstructured":"Mahmood, K.: Performance comparison of nosql database cassandra and sql server for large databases. J. Independ. Stud. Res. (JISR) 14(2) (2016)","DOI":"10.31645\/jisrc\/(2016).14.2.0003"},{"key":"287_CR36","unstructured":"Markovic, M., Edwards, P., Corsar, D.: A role for provenance in social computation. In: Proceedings of the First International Workshop on Crowdsourcing the Semantic Web-CrowdSem 2013, CEUR-WS (2013)"},{"issue":"1","key":"287_CR37","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s40537-017-0063-x","volume":"4","author":"E Olshannikova","year":"2017","unstructured":"Olshannikova, E., Olsson, T., Huhtam\u00e4ki, J., K\u00e4rkk\u00e4inen, H.: Conceptualizing big social data. J. Big Data 4(1), 1\u201319 (2017)","journal-title":"J. Big Data"},{"key":"287_CR38","doi-asserted-by":"crossref","unstructured":"Papavasileiou, V., Yocum, K., Deutsch, A.: Ariadne: Online provenance for big graph analytics. In: Proceedings of the 2019 International Conference on Management of Data, pp. 521\u2013536 (2019)","DOI":"10.1145\/3299869.3300091"},{"issue":"12","key":"287_CR39","doi-asserted-by":"publisher","first-page":"1351","DOI":"10.14778\/3402755.3402768","volume":"4","author":"H Park","year":"2011","unstructured":"Park, H., Ikeda, R., Widom, J.: Ramp: a system for capturing and tracing provenance in mapreduce workflows. Proc. VLDB Endow. 4(12), 1351\u20131354 (2011)","journal-title":"Proc. VLDB Endow."},{"key":"287_CR40","doi-asserted-by":"crossref","unstructured":"Ramesh, D., Kumar, A.: Query driven implementation of twitter base using cassandra. In: 2018 International Conference on Current Trends towards Converging Technologies (ICCTCT), pp. 1\u20134. IEEE (2018)","DOI":"10.1109\/ICCTCT.2018.8551136"},{"key":"287_CR41","unstructured":"Ramusat, Y., Maniu, S., Senellart, P.: Semiring provenance over graph databases. In: 10th $$\\{$$USENIX$$\\}$$ Workshop on the Theory and Practice of Provenance (TaPP 2018) (2018)"},{"key":"287_CR42","doi-asserted-by":"crossref","unstructured":"Ranganath, S., Gundecha, P., Liu, H.: A tool for assisting provenance search in social media. In: Proceedings of the 22nd ACM International Conference on Information and Knowledge Management, pp. 2517\u20132520 (2013)","DOI":"10.1145\/2505515.2508214"},{"key":"287_CR43","doi-asserted-by":"crossref","unstructured":"Rani, A., Goyal, N., Gadia, S.K.: Data provenance for historical queries in relational database. In: Proceedings of the 8th Annual ACM India Conference, pp. 117\u2013122 (2015)","DOI":"10.1145\/2835043.2835047"},{"key":"287_CR44","doi-asserted-by":"crossref","unstructured":"Rani, A., Goyal, N., Gadia, S.K.: Efficient multi-depth querying on provenance of relational queries using graph database. In: Proceedings of the 9th Annual ACM India Conference, pp. 11\u201320 (2016)","DOI":"10.1145\/2998476.2998480"},{"key":"287_CR45","doi-asserted-by":"publisher","first-page":"87","DOI":"10.1007\/978-3-030-69377-0_8","volume-title":"Databases Theory and Applications","author":"A Rani","year":"2021","unstructured":"Rani, A., Goyal, N., Gadia, S.K.: Twitter data modelling and provenance support for key-value pair databases. In: Qiao, M., Vossen, G., Wang, S., Li, L. (eds.) Databases Theory and Applications, pp. 87\u201398. Springer, Cham (2021a)"},{"key":"287_CR46","doi-asserted-by":"crossref","unstructured":"Rani, A., Goyal, N., K\u00a0Gadia, S.: Provenance framework for twitter data using zero-information loss graph database. In: 8th ACM IKDD CODS and 26th COMAD, pp. 74\u201382 (2021b)","DOI":"10.1145\/3430984.3431014"},{"issue":"1","key":"287_CR47","doi-asserted-by":"publisher","first-page":"1534519","DOI":"10.1080\/23311916.2018.1534519","volume":"5","author":"AP Rodrigues","year":"2018","unstructured":"Rodrigues, A.P., Chiplunkar, N.N.: Real-time twitter data analysis using hadoop ecosystem. Cogent Eng. 5(1), 1534519 (2018)","journal-title":"Cogent Eng."},{"key":"287_CR48","doi-asserted-by":"crossref","unstructured":"Schmidt, F.M., Geyer, C., Schaeffer-Filho, A., DeBloch, S., Hu, Y.: Change data capture in nosql databases: a functional and performance comparison. In: 2015 IEEE Symposium on Computers and Communication (ISCC), pp. 562\u2013567. IEEE (2015)","DOI":"10.1109\/ISCC.2015.7405574"},{"key":"287_CR49","doi-asserted-by":"publisher","first-page":"104","DOI":"10.1007\/978-3-030-31423-1_3","volume-title":"Reasoning Web, Explainable Artificial Intelligence","author":"P Senellart","year":"2019","unstructured":"Senellart, P.: Provenance in databases: principles and applications. In: Reasoning Web, Explainable Artificial Intelligence, pp. 104\u2013109. Springer, Cham (2019)"},{"key":"287_CR50","unstructured":"Simmhan, Y.L., Plale, B., Gannon, D.: A Survey of Data Provenance Techniques, vol. 47405, p. 69. Computer Science Department, Indiana University, Bloomington (2005)"},{"key":"287_CR51","doi-asserted-by":"crossref","unstructured":"Taxidou, I., De\u00a0Nies, T., Verborgh, R., Fischer, P.M., Mannens, E., Van\u00a0de, Walle, R.: Modeling information diffusion in social media as provenance with w3c prov. In: Proceedings of the 24th International Conference on World Wide Web, pp. 819\u2013824 (2015)","DOI":"10.1145\/2740908.2742475"},{"issue":"1","key":"287_CR52","doi-asserted-by":"publisher","first-page":"47","DOI":"10.1007\/s10619-017-7211-3","volume":"36","author":"I Taxidou","year":"2018","unstructured":"Taxidou, I., Lieber, S., Fischer, P.M., De Nies, T., Verborgh, R.: Web-scale provenance reconstruction of implicit information diffusion on social media. Distrib. Parallel Datab. 36(1), 47\u201379 (2018)","journal-title":"Distrib. Parallel Datab."},{"key":"287_CR53","doi-asserted-by":"crossref","unstructured":"Wang, J., Crawl, D., Purawat, S., Nguyen, M., Altintas, I.: Big data provenance: challenges, state of the art and opportunities. In: 2015 IEEE International Conference on Big Data (Big Data), pp. 2509\u20132516. IEEE (2015)","DOI":"10.1109\/BigData.2015.7364047"},{"key":"287_CR54","first-page":"19","volume":"2017","author":"IM Yazici","year":"2017","unstructured":"Yazici, I.M., Aktas, M.S., Gokturk, M.: A novel approach to user involved big data provenance visualization. DBKDA 2017, 19 (2017)","journal-title":"DBKDA"},{"issue":"12","key":"287_CR55","doi-asserted-by":"publisher","first-page":"5523","DOI":"10.3390\/app11125523","volume":"11","author":"Q Ye","year":"2021","unstructured":"Ye, Q., Lu, M.: s2p: provenance research for stream processing system. Appl. Sci. 11(12), 5523 (2021)","journal-title":"Appl. Sci."},{"issue":"4","key":"287_CR56","doi-asserted-by":"publisher","first-page":"663","DOI":"10.3390\/sym13040663","volume":"13","author":"C Zhang","year":"2021","unstructured":"Zhang, C., Fathollahi-Fard, A.M., Li, J., Tian, G., Zhang, T.: Disassembly sequence planning for intelligent manufacturing using social engineering optimizer. Symmetry 13(4), 663 (2021)","journal-title":"Symmetry"}],"container-title":["International Journal of Data Science and Analytics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41060-021-00287-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s41060-021-00287-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41060-021-00287-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,9]],"date-time":"2025-04-09T09:56:09Z","timestamp":1744192569000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s41060-021-00287-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,11,9]]},"references-count":56,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2022,6]]}},"alternative-id":["287"],"URL":"https:\/\/doi.org\/10.1007\/s41060-021-00287-9","relation":{},"ISSN":["2364-415X","2364-4168"],"issn-type":[{"type":"print","value":"2364-415X"},{"type":"electronic","value":"2364-4168"}],"subject":[],"published":{"date-parts":[[2021,11,9]]},"assertion":[{"value":"22 April 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 September 2021","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 November 2021","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"On behalf of all authors, the corresponding author states that there is no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of Interest"}}]}}