{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,6]],"date-time":"2025-12-06T05:03:36Z","timestamp":1764997416540,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":75,"publisher":"ACM","license":[{"start":{"date-parts":[[2022,2,11]],"date-time":"2022-02-11T00:00:00Z","timestamp":1644537600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"Swiss National Science Foundation","award":["200021_185043"],"award-info":[{"award-number":["200021_185043"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2022,2,11]]},"DOI":"10.1145\/3488560.3498496","type":"proceedings-article","created":{"date-parts":[[2022,2,15]],"date-time":"2022-02-15T21:42:57Z","timestamp":1644961377000},"page":"16-26","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":6,"title":["Wikipedia Reader Navigation"],"prefix":"10.1145","author":[{"given":"Akhil","family":"Arora","sequence":"first","affiliation":[{"name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne, Lausanne, Switzerland"}]},{"given":"Martin","family":"Gerlach","sequence":"additional","affiliation":[{"name":"Wikimedia Foundation, San Francisco, CA, USA"}]},{"given":"Tiziano","family":"Piccardi","sequence":"additional","affiliation":[{"name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne, Lausanne, Switzerland"}]},{"given":"Alberto","family":"Garc\u00eda-Dur\u00e1n","sequence":"additional","affiliation":[{"name":"Atinary Technologies, Lausanne, Switzerland"}]},{"given":"Robert","family":"West","sequence":"additional","affiliation":[{"name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne, Lausanne, Switzerland"}]}],"member":"320","published-online":{"date-parts":[[2022,2,15]]},"reference":[{"key":"e_1_3_2_2_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/3274290"},{"key":"e_1_3_2_2_2_1","doi-asserted-by":"publisher","DOI":"10.1145\/2872427.2883024"},{"key":"e_1_3_2_2_3_1","volume-title":"[n.d.]. Word vectors for 157 languages. https:\/\/fasttext.cc\/docs\/en\/crawl-vectors.html . accessed","author":"Bojanowski P.","year":"2021","unstructured":"P. Bojanowski, E. Grave, A. Joulin, and T. Mikolov. [n.d.]. Word vectors for 157 languages. https:\/\/fasttext.cc\/docs\/en\/crawl-vectors.html . accessed: 13 August 2021."},{"key":"e_1_3_2_2_4_1","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00051"},{"key":"e_1_3_2_2_5_1","doi-asserted-by":"publisher","DOI":"10.1016\/0169--7552(95)00043--7"},{"key":"e_1_3_2_2_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/2187836.2187919"},{"key":"e_1_3_2_2_7_1","volume-title":"The Wiki Game. https:\/\/www.thewikigame.com\/. accessed","author":"Clemesha Alex","year":"2021","unstructured":"Alex Clemesha. [n.d.]. The Wiki Game. https:\/\/www.thewikigame.com\/. accessed: 13 August 2021."},{"key":"e_1_3_2_2_8_1","doi-asserted-by":"crossref","unstructured":"Cristian Consonni David Laniado and Alberto Montresor. 2019. WikiLinkGraphs: A Complete Longitudinal and Multi-Language Dataset of the Wikipedia Link Networks . (2019) 598--607.","DOI":"10.1609\/icwsm.v13i01.3257"},{"key":"e_1_3_2_2_9_1","doi-asserted-by":"publisher","DOI":"10.1098\/rspa.2019.0740"},{"key":"e_1_3_2_2_10_1","volume-title":"Extrapolating paths with graph neural networks. arXiv preprint arXiv:1903.07518","author":"Cordonnier Jean-Baptiste","year":"2019","unstructured":"Jean-Baptiste Cordonnier and Andreas Loukas. 2019. Extrapolating paths with graph neural networks. arXiv preprint arXiv:1903.07518 (2019)."},{"key":"e_1_3_2_2_11_1","volume-title":"Proc. ICWSM .","author":"Dallmann Alexander","year":"2016","unstructured":"Alexander Dallmann, Thomas Niebler, Florian Lemmerich, and Andreas Hotho. 2016. Extracting semantics from random walks on wikipedia: Comparing learning and counting methods. In Proc. ICWSM ."},{"key":"e_1_3_2_2_12_1","article-title":"Different topic, different trafic: How search and navigation interplay on wikipedia","volume":"1","author":"Dimitrov Dimitar","year":"2019","unstructured":"Dimitar Dimitrov, Florian Lemmerich, Fabian Fl\u00f6ck, and Markus Strohmaier. 2019. Different topic, different trafic: How search and navigation interplay on wikipedia. The Journal of Web Science , Vol. 1 (2019).","journal-title":"The Journal of Web Science"},{"key":"e_1_3_2_2_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/2872518.2889388"},{"key":"e_1_3_2_2_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/3038912.3052613"},{"key":"e_1_3_2_2_15_1","volume-title":"Analytics Datasets: Clickstream. https:\/\/dumps.wikimedia.org\/other\/clickstream\/readme.html . accessed","author":"Foundation Wikimedia","year":"2021","unstructured":"Wikimedia Foundation. [n.d.] a. Analytics Datasets: Clickstream. https:\/\/dumps.wikimedia.org\/other\/clickstream\/readme.html . accessed: 13 August 2021."},{"key":"e_1_3_2_2_16_1","volume-title":"Analytics Datasets: Pageviews. https:\/\/dumps.wikimedia.org\/other\/pageviews\/readme.html . accessed","author":"Foundation Wikimedia","year":"2021","unstructured":"Wikimedia Foundation. [n.d.] b. Analytics Datasets: Pageviews. https:\/\/dumps.wikimedia.org\/other\/pageviews\/readme.html . accessed: 13 August 2021."},{"key":"e_1_3_2_2_17_1","volume-title":"https:\/\/en.wikipedia.org\/wiki\/Infobox . accessed","author":"Foundation Wikimedia","year":"2021","unstructured":"Wikimedia Foundation. [n.d.] c. Infobox. https:\/\/en.wikipedia.org\/wiki\/Infobox . accessed: 13 August 2021."},{"key":"e_1_3_2_2_18_1","volume-title":"https:\/\/dumps.wikimedia.org\/backup-index.html . accessed","author":"Foundation Wikimedia","year":"2021","unstructured":"Wikimedia Foundation. [n.d.] d. Wikimedia Downloads. https:\/\/dumps.wikimedia.org\/backup-index.html . accessed: 13 August 2021."},{"key":"e_1_3_2_2_19_1","volume-title":"Wikimedia Privacy Policy. https:\/\/foundation.wikimedia.org\/wiki\/Privacy_policy . accessed","author":"Foundation Wikimedia","year":"2021","unstructured":"Wikimedia Foundation. [n.d.] e. Wikimedia Privacy Policy. https:\/\/foundation.wikimedia.org\/wiki\/Privacy_policy . accessed: 13 August 2021."},{"key":"e_1_3_2_2_20_1","volume-title":"Wikipedia Pageviews Analysis Tool. https:\/\/pageviews.toolforge.org . accessed","author":"Foundation Wikimedia","year":"2021","unstructured":"Wikimedia Foundation. [n.d.] f. Wikipedia Pageviews Analysis Tool. https:\/\/pageviews.toolforge.org . accessed: 13 August 2021."},{"key":"e_1_3_2_2_21_1","volume-title":"https:\/\/en.wikipedia.org\/wiki\/Wikipedia:WikiProject_Council\/Directory . accessed","author":"Wikimedia Foundation. [n.d.] g. WikiProject Council","year":"2021","unstructured":"Wikimedia Foundation. [n.d.] g. WikiProject Council\/Directory. https:\/\/en.wikipedia.org\/wiki\/Wikipedia:WikiProject_Council\/Directory . accessed: 13 August 2021."},{"key":"e_1_3_2_2_22_1","volume-title":"Wikistats: Pageview complete dumps. https:\/\/dumps.wikimedia.org\/other\/pageview_complete\/readme.html . accessed","author":"Foundation Wikimedia","year":"2021","unstructured":"Wikimedia Foundation. [n.d.] h. Wikistats: Pageview complete dumps. https:\/\/dumps.wikimedia.org\/other\/pageview_complete\/readme.html . accessed: 13 August 2021."},{"key":"e_1_3_2_2_23_1","volume-title":"Wikimedia Webrequest Server Logs . https:\/\/wikitech.wikimedia.org\/wiki\/Analytics\/Data_Lake\/Traffic\/Webrequest . accessed","author":"Foundation Wikimedia","year":"2021","unstructured":"Wikimedia Foundation. 2015. Wikimedia Webrequest Server Logs . https:\/\/wikitech.wikimedia.org\/wiki\/Analytics\/Data_Lake\/Traffic\/Webrequest . accessed: 13 August 2021."},{"key":"e_1_3_2_2_24_1","volume-title":"The memory remains: Understanding collective memory in the digital age. Science advances","author":"Garc'ia-Gavilanes Ruth","year":"2017","unstructured":"Ruth Garc'ia-Gavilanes, Anders Mollgaard, Milena Tsvetkova, and Taha Yasseri. 2017. The memory remains: Understanding collective memory in the digital age. Science advances , Vol. 3, 4 (2017)."},{"key":"e_1_3_2_2_25_1","doi-asserted-by":"publisher","DOI":"10.1145\/2809563.2809598"},{"key":"e_1_3_2_2_26_1","doi-asserted-by":"crossref","unstructured":"Patrick Gildersleve and Taha Yasseri. 2018. Inspiration Captivation and Misdirection: Emergent Properties in Networks of Online Navigation. In Complex Networks IX. 271--282.","DOI":"10.1007\/978-3-319-73198-8_23"},{"key":"e_1_3_2_2_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/2700171.2791036"},{"key":"e_1_3_2_2_28_1","volume-title":"Learning Word Vectors for 157 Languages. arXiv preprint arXiv:1802.06893","author":"Grave Edouard","year":"2018","unstructured":"Edouard Grave, Piotr Bojanowski, Prakhar Gupta, Armand Joulin, and Tomas Mikolov. 2018. Learning Word Vectors for 157 Languages. arXiv preprint arXiv:1802.06893 (2018)."},{"key":"e_1_3_2_2_29_1","volume-title":"Text processing utilities for MediaWiki. https:\/\/github.com\/mediawiki-utilities\/python-mwtext . accessed","author":"Halfaker Aaron","year":"2021","unstructured":"Aaron Halfaker and Gabriel Altay. [n.d.]. Text processing utilities for MediaWiki. https:\/\/github.com\/mediawiki-utilities\/python-mwtext . accessed: 13 August 2021."},{"key":"e_1_3_2_2_30_1","volume-title":"The WikiTax Taxonomy. https:\/\/github.com\/wikimedia\/wikitax . accessed","author":"Halfaker Aaron","year":"2021","unstructured":"Aaron Halfaker and Isaac Johnson. [n.d.]. The WikiTax Taxonomy. https:\/\/github.com\/wikimedia\/wikitax . accessed: 13 August 2021."},{"key":"e_1_3_2_2_31_1","doi-asserted-by":"publisher","DOI":"10.1145\/2736277.2741117"},{"key":"e_1_3_2_2_32_1","doi-asserted-by":"publisher","DOI":"10.1145\/2481492.2481502"},{"key":"e_1_3_2_2_33_1","volume-title":"2021 a. Language-agnostic Topic Classification for Wikipedia. arXiv preprint arXiv:2103.00068","author":"Johnson Isaac","year":"2021","unstructured":"Isaac Johnson, Martin Gerlach, and Diego S\u00e1ez-Trumper. 2021 a. Language-agnostic Topic Classification for Wikipedia. arXiv preprint arXiv:2103.00068 (2021)."},{"key":"e_1_3_2_2_34_1","doi-asserted-by":"publisher","DOI":"10.1609\/icwsm.v15i1.18058"},{"key":"e_1_3_2_2_35_1","volume-title":"Web Routineness and Limits of Predictability: Investigating Demographic and Behavioral Differences Using Web Tracking Data. arXiv preprint arXiv:2012.15112","author":"Kulshrestha Juhi","year":"2020","unstructured":"Juhi Kulshrestha, Marcos Oliveira, Orkut Karacalik, Denis Bonnay, and Claudia Wagner. 2020. Web Routineness and Limits of Predictability: Investigating Demographic and Behavioral Differences Using Web Tracking Data. arXiv preprint arXiv:2012.15112 (2020)."},{"key":"e_1_3_2_2_36_1","doi-asserted-by":"publisher","DOI":"10.1080\/13614568.2016.1179798"},{"key":"e_1_3_2_2_37_1","doi-asserted-by":"publisher","DOI":"10.2139\/ssrn.3739176"},{"key":"e_1_3_2_2_38_1","doi-asserted-by":"publisher","DOI":"10.1145\/2631775.2631805"},{"key":"e_1_3_2_2_39_1","doi-asserted-by":"publisher","DOI":"10.1145\/3289600.3291021"},{"key":"e_1_3_2_2_40_1","doi-asserted-by":"publisher","DOI":"10.1038\/s41562-020-00985-7"},{"key":"e_1_3_2_2_41_1","volume-title":"Wikipedia's Network Bias on Controversial Topics. arXiv preprint arXiv:2007.08197","author":"Menghini Cristina","year":"2020","unstructured":"Cristina Menghini, Aris Anagnostopoulos, and Eli Upfal. 2020. Wikipedia's Network Bias on Controversial Topics. arXiv preprint arXiv:2007.08197 (2020)."},{"key":"e_1_3_2_2_42_1","first-page":"878","article-title":"WikiHist.html","volume":"14","author":"Mitrevski Blagoj","year":"2020","unstructured":"Blagoj Mitrevski, Tiziano Piccardi, and Robert West. 2020. WikiHist.html: English Wikipedia's Full Revision History in HTML Format. Proc. ICWSM , Vol. 14 (2020), 878--884.","journal-title":"English Wikipedia's Full Revision History in HTML Format. Proc. ICWSM"},{"key":"e_1_3_2_2_43_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W18-3026"},{"key":"e_1_3_2_2_44_1","doi-asserted-by":"publisher","DOI":"10.1145\/2835776.2835832"},{"key":"e_1_3_2_2_45_1","doi-asserted-by":"publisher","DOI":"10.5555\/1953048.2078195"},{"key":"e_1_3_2_2_46_1","doi-asserted-by":"crossref","unstructured":"Bryan Perozzi Rami Al-Rfou and Steven Skiena. 2014. DeepWalk: Online Learning of Social Representations. In KDD . 701--710.","DOI":"10.1145\/2623330.2623732"},{"key":"e_1_3_2_2_47_1","volume-title":"Learning the Markov order of paths in a network. arXiv preprint arXiv:2007.02861","author":"Petrovi\u0107 Luka V","year":"2020","unstructured":"Luka V Petrovi\u0107 and Ingo Scholtes. 2020. Learning the Markov order of paths in a network. arXiv preprint arXiv:2007.02861 (2020)."},{"key":"e_1_3_2_2_48_1","volume-title":"A Large-Scale Characterization of How Readers Browse Wikipedia. arXiv preprint arXiv:2112.11848","author":"Piccardi Tiziano","year":"2021","unstructured":"Tiziano Piccardi, Martin Gerlach, Akhil Arora, and Robert West. 2021. A Large-Scale Characterization of How Readers Browse Wikipedia. arXiv preprint arXiv:2112.11848 (2021)."},{"key":"e_1_3_2_2_49_1","doi-asserted-by":"publisher","DOI":"10.1145\/3190616"},{"key":"e_1_3_2_2_50_1","volume-title":"A Taxonomy of Knowledge Gaps for Wikimedia Projects (Second Draft). arXiv preprint arXiv:2008.12314","author":"Redi Miriam","year":"2020","unstructured":"Miriam Redi, Martin Gerlach, Isaac Johnson, Jonathan Morgan, and Leila Zia. 2020. A Taxonomy of Knowledge Gaps for Wikimedia Projects (Second Draft). arXiv preprint arXiv:2008.12314 (2020)."},{"key":"e_1_3_2_2_51_1","volume-title":"Sudden Attention Shifts on Wikipedia Following COVID-19 Mobility Restrictions. arXiv preprint arXiv:2005.08505","author":"Ribeiro Manoel Horta","year":"2020","unstructured":"Manoel Horta Ribeiro, Kristina Gligori\u0107, Maxime Peyrard, Florian Lemmerich, Markus Strohmaier, and Robert West. 2020. Sudden Attention Shifts on Wikipedia Following COVID-19 Mobility Restrictions. arXiv preprint arXiv:2005.08505 (2020)."},{"key":"e_1_3_2_2_52_1","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0170746"},{"key":"e_1_3_2_2_53_1","volume-title":"Memory in network flows and its effects on spreading dynamics and community detection. Nature communications","author":"Rosvall Martin","year":"2014","unstructured":"Martin Rosvall, Alcides V Esquivel, Andrea Lancichinetti, Jevin D West, and Renaud Lambiotte. 2014. Memory in network flows and its effects on spreading dynamics and community detection. Nature communications , Vol. 5 (2014)."},{"key":"e_1_3_2_2_54_1","doi-asserted-by":"publisher","DOI":"10.1145\/3308560.3316753"},{"key":"e_1_3_2_2_55_1","doi-asserted-by":"publisher","DOI":"10.1145\/2556195.2556232"},{"key":"e_1_3_2_2_56_1","doi-asserted-by":"publisher","DOI":"10.1145\/2910896.2910908"},{"volume-title":"Scikit-learn: Adjusted Mutual Information Score. https:\/\/scikit-learn.org\/stable\/modules\/generated\/sklearn.metrics.adjusted_mutual_info_score.html . accessed","year":"2021","key":"e_1_3_2_2_57_1","unstructured":"Scikit-learn. [n.d.]. Scikit-learn: Adjusted Mutual Information Score. https:\/\/scikit-learn.org\/stable\/modules\/generated\/sklearn.metrics.adjusted_mutual_info_score.html . accessed: 13 August 2021."},{"key":"e_1_3_2_2_58_1","doi-asserted-by":"publisher","DOI":"10.1145\/3213769"},{"key":"e_1_3_2_2_59_1","doi-asserted-by":"publisher","DOI":"10.1093\/joc\/jqx003"},{"key":"e_1_3_2_2_60_1","doi-asserted-by":"publisher","DOI":"10.1145\/2567948.2567956"},{"key":"e_1_3_2_2_61_1","doi-asserted-by":"publisher","DOI":"10.1145\/2736277.2741080"},{"key":"e_1_3_2_2_62_1","doi-asserted-by":"crossref","unstructured":"Philipp Singer Denis Helic Behnam Taraghi and Markus Strohmaier. 2014. Detecting Memory and Structure in Human Navigation Patterns Using Markov Chain Models of Varying Order.","DOI":"10.1371\/journal.pone.0102070"},{"key":"e_1_3_2_2_63_1","doi-asserted-by":"publisher","DOI":"10.1145\/3038912.3052716"},{"key":"e_1_3_2_2_64_1","doi-asserted-by":"publisher","DOI":"10.4018\/ijswis.2013100103"},{"key":"e_1_3_2_2_65_1","volume-title":"The WikiSRS Dataset. https:\/\/github.com\/OSU-slatelab\/WikiSRS . accessed","author":"Slatelab OSU","year":"2021","unstructured":"OSU Slatelab. [n.d.]. The WikiSRS Dataset. https:\/\/github.com\/OSU-slatelab\/WikiSRS . accessed: 13 August 2021."},{"key":"e_1_3_2_2_66_1","doi-asserted-by":"publisher","DOI":"10.1145\/258549.258816"},{"key":"e_1_3_2_2_67_1","doi-asserted-by":"publisher","DOI":"10.1145\/3306446.3340829"},{"key":"e_1_3_2_2_68_1","doi-asserted-by":"publisher","DOI":"10.1145\/1553374.1553511"},{"key":"e_1_3_2_2_69_1","volume-title":"Proc. ICWSM .","author":"Warncke-Wang Morten","year":"2015","unstructured":"Morten Warncke-Wang, Vivek Ranjan, Loren Terveen, and Brent Hecht. 2015. Misalignment between supply and demand of quality content in peer production communities. In Proc. ICWSM ."},{"key":"e_1_3_2_2_70_1","volume-title":"https:\/\/dlab.epfl.ch\/wikispeedia . accessed","author":"West Robert","year":"2021","unstructured":"Robert West. [n.d.]. Wikispeedia. https:\/\/dlab.epfl.ch\/wikispeedia . accessed: 13 August 2021."},{"key":"e_1_3_2_2_71_1","doi-asserted-by":"publisher","DOI":"10.1145\/2187836.2187920"},{"key":"e_1_3_2_2_72_1","volume-title":"Proc. IJCAI . 1598--1603","author":"West Robert","year":"2009","unstructured":"Robert West, Joelle Pineau, and Doina Precup. 2009. Wikispeedia: An Online Game for Inferring Semantic Distances between Concepts. In Proc. IJCAI . 1598--1603."},{"key":"e_1_3_2_2_73_1","volume-title":"Wikipedia Navigation Vectors. https:\/\/meta.wikimedia.org\/wiki\/Research:Wikipedia_Navigation_Vectors . accessed","author":"Wulczyn Ellery","year":"2021","unstructured":"Ellery Wulczyn. [n.d.]. Wikipedia Navigation Vectors. https:\/\/meta.wikimedia.org\/wiki\/Research:Wikipedia_Navigation_Vectors . accessed: 13 August 2021."},{"key":"e_1_3_2_2_74_1","unstructured":"Ellery Wulczyn and Dario Taraborelli. 2015. Wikipedia clickstream. https:\/\/meta.wikimedia.org\/wiki\/Research:Wikipedia_clickstream ."},{"key":"e_1_3_2_2_75_1","doi-asserted-by":"publisher","DOI":"10.6084\/m9.figshare.7698245.v1"}],"event":{"name":"WSDM '22: The Fifteenth ACM International Conference on Web Search and Data Mining","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data","SIGIR ACM Special Interest Group on Information Retrieval"],"location":"Virtual Event AZ USA","acronym":"WSDM '22"},"container-title":["Proceedings of the Fifteenth ACM International Conference on Web Search and Data Mining"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3488560.3498496","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3488560.3498496","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T19:31:19Z","timestamp":1750188679000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3488560.3498496"}},"subtitle":["When Synthetic Data Is Enough"],"short-title":[],"issued":{"date-parts":[[2022,2,11]]},"references-count":75,"alternative-id":["10.1145\/3488560.3498496","10.1145\/3488560"],"URL":"https:\/\/doi.org\/10.1145\/3488560.3498496","relation":{},"subject":[],"published":{"date-parts":[[2022,2,11]]},"assertion":[{"value":"2022-02-15","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}