{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,27]],"date-time":"2025-10-27T20:44:27Z","timestamp":1761597867629},"reference-count":40,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2017,10,20]],"date-time":"2017-10-20T00:00:00Z","timestamp":1508457600000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Distrib Parallel Databases"],"published-print":{"date-parts":[[2018,3]]},"DOI":"10.1007\/s10619-017-7211-3","type":"journal-article","created":{"date-parts":[[2017,10,20]],"date-time":"2017-10-20T10:22:09Z","timestamp":1508494929000},"page":"47-79","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["Web-scale provenance reconstruction of implicit information diffusion on social media"],"prefix":"10.1007","volume":"36","author":[{"given":"Io","family":"Taxidou","sequence":"first","affiliation":[]},{"given":"Sven","family":"Lieber","sequence":"additional","affiliation":[]},{"given":"Peter M.","family":"Fischer","sequence":"additional","affiliation":[]},{"given":"Tom","family":"De Nies","sequence":"additional","affiliation":[]},{"given":"Ruben","family":"Verborgh","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,10,20]]},"reference":[{"key":"7211_CR1","doi-asserted-by":"crossref","unstructured":"Aierken, A., Davis, D.B., Zhang, Q., Gupta, K., Wong, A., Asuncion, H.U.: A multi-level funneling approach to data provenance reconstruction. In: IEEE 10th International Conference on e-Science, vol 2, pp. 71\u201374, IEEE (2014)","DOI":"10.1109\/eScience.2014.54"},{"issue":"3","key":"7211_CR2","doi-asserted-by":"crossref","first-page":"665","DOI":"10.1007\/s10115-010-0360-6","volume":"28","author":"M Al Hasan","year":"2011","unstructured":"Al Hasan, M., Salem, S., Zaki, M.J.: Simclus: an effective algorithm for clustering with a lower bound on similarity. Knowl. Inf. Syst. 28(3), 665\u2013685 (2011)","journal-title":"Knowl. Inf. Syst."},{"issue":"3","key":"7211_CR3","doi-asserted-by":"crossref","first-page":"364","DOI":"10.3390\/a5030364","volume":"5","author":"J Azzopardi","year":"2012","unstructured":"Azzopardi, J., Staff, C.: Incremental clustering of news reports. Algorithms 5(3), 364\u2013378 (2012)","journal-title":"Algorithms"},{"key":"7211_CR4","doi-asserted-by":"crossref","unstructured":"Bakshy, E., Hofman, J.M., Mason, W.A., Watts, D.J.: Everyone\u2019s an influencer: quantifying influence on twitter. In: Proceedings of the 4th ACM International Conference on Web Search and Data Mining, pp. 65\u201374 (2011)","DOI":"10.1145\/1935826.1935845"},{"issue":"1","key":"7211_CR5","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1140\/epjds18","volume":"2","author":"RA Ba\u00f1os","year":"2013","unstructured":"Ba\u00f1os, R.A., Borge-Holthoefer, J., Moreno, Y.: The role of hidden influentials in the diffusion of online information cascades. EPJ Data Sci. 2(1), 1\u201316 (2013)","journal-title":"EPJ Data Sci."},{"issue":"1","key":"7211_CR6","doi-asserted-by":"crossref","first-page":"1","DOI":"10.2200\/S00496ED1V01Y201304DMK007","volume":"4","author":"G Barbier","year":"2013","unstructured":"Barbier, G., Feng, Z., Gundecha, P., Liu, H.: Provenance data in social media. Synth. Lect. Data Min. Knowl. Discov. 4(1), 1\u201384 (2013)","journal-title":"Synth. Lect. Data Min. Knowl. Discov."},{"key":"7211_CR7","doi-asserted-by":"crossref","unstructured":"Barbosa, S., Cesar, R.M. Jr., Cosley, D.: Using text similarity to detect social interactions not captured by formal reply mechanisms. In: 2015 IEEE 11th International Conference on e-Science (e-Science), pp. 36\u201346. IEEE (2015)","DOI":"10.1109\/eScience.2015.31"},{"key":"7211_CR8","doi-asserted-by":"crossref","unstructured":"Blei, D.M., Lafferty, J.D.: Dynamic topic models. In: Proceedings of the 23rd International Conference on Machine Learning, pp. 113\u2013120 (2006)","DOI":"10.1145\/1143844.1143859"},{"issue":"10\u201317","key":"7211_CR9","first-page":"30","volume":"10","author":"M Cha","year":"2010","unstructured":"Cha, M., Haddadi, H., Benevenuto, F., Gummadi, P.K.: Measuring user influence in Twitter: the million follower fallacy. ICWSM 10(10\u201317), 30 (2010)","journal-title":"ICWSM"},{"issue":"4","key":"7211_CR10","doi-asserted-by":"crossref","first-page":"379","DOI":"10.1561\/1900000006","volume":"1","author":"J Cheney","year":"2009","unstructured":"Cheney, J., Chiticariu, L., Tan, W.C., et al.: Provenance in databases: why, how, and where. Found. Trends\u00ae Databases 1(4), 379\u2013474 (2009)","journal-title":"Found. Trends\u00ae Databases"},{"key":"7211_CR11","doi-asserted-by":"crossref","unstructured":"Comarela, G., Crovella, M., Almeida, V., Benevenuto, F.: Understanding factors that affect response rates in Twitter. In: Proceedings of the 23rd ACM Conference on Hypertext and Social Media, pp. 123\u2013132 (2012)","DOI":"10.1145\/2309996.2310017"},{"issue":"4","key":"7211_CR12","first-page":"44","volume":"30","author":"SB Davidson","year":"2007","unstructured":"Davidson, S.B., Boulakia, S.C., Eyal, A., Lud\u00e4scher, B., McPhillips, T.M., Bowers, S., Anand, M.K., Freire, J.: Provenance in scientific workflow systems. IEEE Data Eng. Bull. 30(4), 44\u201350 (2007)","journal-title":"IEEE Data Eng. Bull."},{"key":"7211_CR13","doi-asserted-by":"crossref","unstructured":"De Nies, T., Coppens, S., Van Deursen, D., Mannens, E., Van de Walle, R.: Automatic discovery of high-level provenance using semantic similarity. In: IPAW (2012)","DOI":"10.1007\/978-3-642-34222-6_8"},{"key":"7211_CR14","doi-asserted-by":"crossref","unstructured":"De Nies, T., Taxidou, I., Dimou, A., Verborgh, R., Fischer, P.M., Mannens, E., Van de Walle, R.: Towards multi-level provenance reconstruction of information diffusion on social media. In: Proceedings of the 24th ACM International on Conference on Information and Knowledge Management, pp. 1823\u20131826 (2015)","DOI":"10.1145\/2806416.2806642"},{"key":"7211_CR15","doi-asserted-by":"crossref","unstructured":"De Nies, T., Mannens, E., Van de Walle, R.: Reconstructing human-generated provenance through similarity-based clustering. In: International Provenance and Annotation Workshop, Springer, pp. 191\u2013194 (2016)","DOI":"10.1007\/978-3-319-40593-3_19"},{"key":"7211_CR16","doi-asserted-by":"crossref","unstructured":"Feng, Z., Gundecha, P., Liu, H.: Recovering information recipients in social media via provenance. In: ASONAM, pp. 706\u2013711 (2013)","DOI":"10.1145\/2492517.2492629"},{"key":"7211_CR17","doi-asserted-by":"crossref","unstructured":"Glavic, B., Sheykh Esmaili, K., Fischer, P.M., Tatbul, N.: Ariadne: Managing fine-grained provenance on data streams. In: Proceedings of the 7th ACM International Conference on Distributed Event-Based Systems, pp. 39\u201350 (2013)","DOI":"10.1145\/2488222.2488256"},{"key":"7211_CR18","doi-asserted-by":"crossref","unstructured":"Gundecha, P., Liu, H.: Mining social media: a brief introduction. In: New Directions in Informatics, Optimization, Logistics, and Production, Informs, pp. 1\u201317 (2012)","DOI":"10.1287\/educ.1120.0105"},{"key":"7211_CR19","doi-asserted-by":"crossref","unstructured":"Gundecha, P., Ranganath, S., Feng, Z., Liu, H.: A tool for collecting provenance data in social media. In: Proceedings of the 19th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp. 1462\u20131465. ACM (2013b)","DOI":"10.1145\/2487575.2487713"},{"key":"7211_CR20","doi-asserted-by":"crossref","unstructured":"Jaho, E., Tzoannos, E., Papadopoulos, A., Sarris, N.: Alethiometer: a framework for assessing trustworthiness and content validity in social media. In: Proceedings of the 23rd International Conference on World Wide Web, pp. 749\u2013752. ACM (2014)","DOI":"10.1145\/2567948.2579324"},{"issue":"1","key":"7211_CR21","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1007\/s11280-007-0018-9","volume":"11","author":"S Khy","year":"2008","unstructured":"Khy, S., Ishikawa, Y., Kitagawa, H.: A novelty-based clustering method for on-line documents. World Wide Web 11(1), 1\u201337 (2008)","journal-title":"World Wide Web"},{"key":"7211_CR22","unstructured":"Kov\u00e1cs, F., Leg\u00e1ny, C., Babos, A.: Cluster validity measurement techniques. In: 6th International Symposium of Hungarian Researchers on Computational Intelligence, Citeseer (2005)"},{"issue":"2","key":"7211_CR23","doi-asserted-by":"crossref","first-page":"249","DOI":"10.1007\/s10115-010-0342-8","volume":"29","author":"P Kranen","year":"2011","unstructured":"Kranen, P., Assent, I., Baldauf, C., Seidl, T.: The clustree: indexing micro-clusters for anytime stream mining. Knowl. Inf. Syst. 29(2), 249\u2013272 (2011)","journal-title":"Knowl. Inf. Syst."},{"key":"7211_CR24","doi-asserted-by":"crossref","unstructured":"Kwon, S., Cha, M., Jung, K., Chen, W., Wang, Y.: Prominent features of rumor propagation in online social media. In: 2013 IEEE 13th International Conference on Data Mining (ICDM), pp. 1103\u20131108. IEEE (2013)","DOI":"10.1109\/ICDM.2013.61"},{"key":"7211_CR25","doi-asserted-by":"crossref","unstructured":"Leskovec, J., Backstrom, L., Kleinberg, J.: Meme-tracking and the dynamics of the news cycle. In: Proceedings of the 15th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp. 497\u2013506 (2009)","DOI":"10.1145\/1557019.1557077"},{"key":"7211_CR26","doi-asserted-by":"crossref","unstructured":"Magliacane, S.: Reconstructing provenance. In: Proceedings of the 11th International Conference on The Semantic Web-Volume Part II, pp. 399\u2013406. Springer, New York (2012)","DOI":"10.1007\/978-3-642-35173-0_29"},{"issue":"6106","key":"7211_CR27","doi-asserted-by":"crossref","first-page":"472","DOI":"10.1126\/science.1230456","volume":"338","author":"PT Metaxas","year":"2012","unstructured":"Metaxas, P.T., Mustafaraj, E.: Social media and the elections. Science 338(6106), 472\u2013473 (2012)","journal-title":"Science"},{"issue":"2\u20133","key":"7211_CR28","doi-asserted-by":"crossref","first-page":"99","DOI":"10.1561\/1800000010","volume":"2","author":"L Moreau","year":"2010","unstructured":"Moreau, L.: The foundations for provenance on the web. Found. Trends Web Sci. 2(2\u20133), 99\u2013241 (2010)","journal-title":"Found. Trends Web Sci."},{"key":"7211_CR29","doi-asserted-by":"crossref","unstructured":"Moreau, L., Missier, P.: (Eds) W3C Provenance Working Group (2013) PROV-DM: The PROV Data Model. W3C","DOI":"10.2200\/S00528ED1V01Y201308WBE007"},{"key":"7211_CR30","doi-asserted-by":"crossref","first-page":"53","DOI":"10.1016\/0377-0427(87)90125-7","volume":"20","author":"PJ Rousseeuw","year":"1987","unstructured":"Rousseeuw, P.J.: Silhouettes: a graphical aid to the interpretation and validation of cluster analysis. J. Comput. Appl. Math. 20, 53\u201365 (1987)","journal-title":"J. Comput. Appl. Math."},{"key":"7211_CR31","doi-asserted-by":"crossref","unstructured":"Sakaki, T., Okazaki, M., Matsuo, Y.: Earthquake shakes twitter users: real-time event detection by social sensors. In: Proceedings of the 19th International Conference on World Wide web, pp. 851\u2013860. ACM (2010)","DOI":"10.1145\/1772690.1772777"},{"key":"7211_CR32","volume-title":"Introduction to Modern Information Retrieval","author":"G Salton","year":"1986","unstructured":"Salton, G., McGill, M.J.: Introduction to Modern Information Retrieval. McGraw-Hill, New York (1986)"},{"key":"7211_CR33","volume-title":"Applied Multivariate Techniques","author":"S Sharma","year":"1995","unstructured":"Sharma, S.: Applied Multivariate Techniques. Wiley, New York (1995)"},{"key":"7211_CR34","unstructured":"Simmons, M.P., Adamic, L.A., Adar, E.: Memes online: Extracted, subtracted, injected, and recollected. In: Fifth International AAAI Conference on Weblogs and Social Media (2011)"},{"key":"7211_CR35","doi-asserted-by":"crossref","unstructured":"Suen, C., Huang, S., Eksombatchai, C., Sosic, R., Leskovec, J.: NIFTY: a system for large scale information flow tracking and clustering. In: Proceedings of the 22nd International Conference on World Wide Web, pp. 1237\u20131248. ACM (2013)","DOI":"10.1145\/2488388.2488496"},{"key":"7211_CR36","doi-asserted-by":"crossref","unstructured":"Taxidou, I., Fischer, P.M.: Online analysis of information diffusion in twitter. In: Proceedings of the 23rd International Conference on World Wide Web, WWW \u201914 Companion (2014)","DOI":"10.1145\/2567948.2580050"},{"key":"7211_CR37","doi-asserted-by":"crossref","unstructured":"Taxidou, I., De Nies, T., Verborgh, R., Fischer, P., Mannens, E., Van de Walle, R.: Modeling information diffusion in social media as provenance with W3C PROV. In: Proceedings of the 6th International Workshop on Modeling Social Media, pp. 819\u2013824 (2015)","DOI":"10.1145\/2740908.2742475"},{"key":"7211_CR38","doi-asserted-by":"crossref","unstructured":"Taxidou, I., Fischer, PM., De Nies, T., Mannens, E., Van de Walle, R.: Information diffusion and provenance of interactions in twitter: Is it only about retweets? In: Proceedings of the 25th International Conference Companion on World Wide Web, pp. 113\u2013114 (2016)","DOI":"10.1145\/2872518.2889393"},{"issue":"4","key":"7211_CR39","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/1852102.1852106","volume":"28","author":"W Webber","year":"2010","unstructured":"Webber, W., Moffat, A., Zobel, J.: A similarity measure for indefinite rankings. ACM Trans. Inf. Syst. 28(4), 1\u201320 (2010)","journal-title":"ACM Trans. Inf. Syst."},{"key":"7211_CR40","doi-asserted-by":"crossref","unstructured":"Yang, J., Leskovec, J.: Modeling information diffusion in implicit networks. In: 2010 IEEE International Conference on Data Mining, pp. 599\u2013608 (2010)","DOI":"10.1109\/ICDM.2010.22"}],"container-title":["Distributed and Parallel Databases"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10619-017-7211-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10619-017-7211-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10619-017-7211-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,10,4]],"date-time":"2019-10-04T19:39:08Z","timestamp":1570217948000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10619-017-7211-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,10,20]]},"references-count":40,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2018,3]]}},"alternative-id":["7211"],"URL":"https:\/\/doi.org\/10.1007\/s10619-017-7211-3","relation":{},"ISSN":["0926-8782","1573-7578"],"issn-type":[{"value":"0926-8782","type":"print"},{"value":"1573-7578","type":"electronic"}],"subject":[],"published":{"date-parts":[[2017,10,20]]}}}