{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,25]],"date-time":"2025-03-25T14:42:12Z","timestamp":1742913732422,"version":"3.40.3"},"publisher-location":"Cham","reference-count":38,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031438486"},{"type":"electronic","value":"9783031438493"}],"license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023]]},"DOI":"10.1007\/978-3-031-43849-3_5","type":"book-chapter","created":{"date-parts":[[2023,9,21]],"date-time":"2023-09-21T21:01:25Z","timestamp":1695330085000},"page":"47-61","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["PreprintResolver: Improving Citation Quality by\u00a0Resolving Published Versions of\u00a0ArXiv Preprints Using Literature Databases"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7540-4980","authenticated-orcid":false,"given":"Louise","family":"Bloch","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5038-5899","authenticated-orcid":false,"given":"Johannes","family":"R\u00fcckert","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7906-0038","authenticated-orcid":false,"given":"Christoph M.","family":"Friedrich","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,9,22]]},"reference":[{"key":"5_CR1","doi-asserted-by":"publisher","unstructured":"Abdill, R.J., Blekhman, R.: Meta-research: tracking the popularity and outcomes of all bioRxiv preprints. eLife 8, e45133 (2019). https:\/\/doi.org\/10.7554\/eLife.45133","DOI":"10.7554\/eLife.45133"},{"key":"5_CR2","doi-asserted-by":"publisher","unstructured":"Accomazzi, A.: ADS Services in support of the Discovery, Management and Evaluation of Science Data. Presentation, December 2015. https:\/\/doi.org\/10.5281\/zenodo.34494","DOI":"10.5281\/zenodo.34494"},{"key":"5_CR3","doi-asserted-by":"publisher","unstructured":"Ammar, W., et al.: Construction of the literature graph in semantic scholar. In: Proceedings of the 2018 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, vol. 3, pp. 84\u201391. Association for Computational Linguistics, New Orleans - Louisiana (2018). https:\/\/doi.org\/10.18653\/v1\/n18-3011, industry Papers","DOI":"10.18653\/v1\/n18-3011"},{"key":"5_CR4","unstructured":"arXiv.org: ArXiv annual report 2022. Technical report (2023). https:\/\/info.arxiv.org\/about\/reports\/2022_arXiv_annual_report.pdf. Accessed 17 May 2023"},{"issue":"6288","key":"5_CR5","doi-asserted-by":"publisher","first-page":"899","DOI":"10.1126\/science.aaf9133","volume":"352","author":"JM Berg","year":"2016","unstructured":"Berg, J.M., et al.: Preprints for the life sciences. Science 352(6288), 899\u2013901 (2016). https:\/\/doi.org\/10.1126\/science.aaf9133","journal-title":"Science"},{"issue":"6","key":"5_CR6","doi-asserted-by":"publisher","first-page":"5285","DOI":"10.1007\/s11192-021-03900-7","volume":"126","author":"G Cabanac","year":"2021","unstructured":"Cabanac, G., Oikonomidi, T., Boutron, I.: Day-to-day discovery of preprint-publication links. Scientometrics 126(6), 5285\u20135304 (2021). https:\/\/doi.org\/10.1007\/s11192-021-03900-7","journal-title":"Scientometrics"},{"key":"5_CR7","unstructured":"Canese, K., Weis, S.: Pubmed: the bibliographic database. In: The NCBI Handbook 2(1) (2013)"},{"key":"5_CR8","doi-asserted-by":"publisher","unstructured":"Cornell University: ArXiv dataset. Dataset (2023). https:\/\/doi.org\/10.34740\/kaggle\/dsv\/5621820","DOI":"10.34740\/kaggle\/dsv\/5621820"},{"issue":"3","key":"5_CR9","doi-asserted-by":"publisher","first-page":"273","DOI":"10.1007\/bf00994018","volume":"20","author":"C Cortes","year":"1995","unstructured":"Cortes, C., Vapnik, V.: Support-vector networks. Mach. Learn. 20(3), 273\u2013297 (1995). https:\/\/doi.org\/10.1007\/bf00994018","journal-title":"Mach. Learn."},{"issue":"2","key":"5_CR10","doi-asserted-by":"publisher","first-page":"203","DOI":"10.1007\/s11192-007-1661-8","volume":"71","author":"PM Davis","year":"2007","unstructured":"Davis, P.M., Fromerth, M.J.: Does the arXiv lead to higher citations and reduced publisher downloads for mathematics articles? Scientometrics 71(2), 203\u2013215 (2007). https:\/\/doi.org\/10.1007\/s11192-007-1661-8","journal-title":"Scientometrics"},{"key":"5_CR11","doi-asserted-by":"publisher","unstructured":"Devlin, J., Chang, M.W., Lee, K., Toutanova, K.: BERT: pre-training of deep bidirectional transformers for language understanding. In: Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, vol. 1, pp. 4171\u20134186. Association for Computational Linguistics, Minneapolis, Minnesota (2019). https:\/\/doi.org\/10.18653\/v1\/n19-1423, long and short papers","DOI":"10.18653\/v1\/n19-1423"},{"issue":"3","key":"5_CR12","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0281659","volume":"18","author":"P Eckmann","year":"2023","unstructured":"Eckmann, P., Bandrowski, A.: PreprintMatch: a tool for preprint to publication detection shows global inequities in scientific publication. PLoS ONE 18(3), e0281659 (2023). https:\/\/doi.org\/10.1371\/journal.pone.0281659","journal-title":"PLoS ONE"},{"key":"5_CR13","unstructured":"Elsevier B.V: Scopus. https:\/\/www.scopus.com\/home.uri. Accessed 22 May 2023"},{"key":"5_CR14","unstructured":"Elsevier B.V: Social Science Research Network (SSRN): Tomorrow\u2019s research today. https:\/\/www.ssrn.com\/index.cfm\/en\/. Accessed 22 May 2023"},{"key":"5_CR15","unstructured":"Feldman, S., Lo, K., Ammar, W.: Citation count analysis for papers with preprints. Preprint (2018). arXiv: 1805.05238v1 [cs.DL]"},{"key":"5_CR16","doi-asserted-by":"publisher","unstructured":"Fraser, N.C., Momeni, F., Mayr, P., Peters, I.: The relationship between bioRxiv preprints, citations and altmetrics. Quant. Sci. Stud. 1(2), 618 \u2013 638 (2020). https:\/\/doi.org\/10.1162\/qss_a_00043","DOI":"10.1162\/qss_a_00043"},{"key":"5_CR17","doi-asserted-by":"publisher","unstructured":"Fu, D.Y., Hughey, J.J.: Meta-research: releasing a preprint is associated with more attention and citations for the peer-reviewed article. eLife 8, e52646 (2019). https:\/\/doi.org\/10.7554\/eLife.52646","DOI":"10.7554\/eLife.52646"},{"issue":"4","key":"5_CR18","doi-asserted-by":"publisher","first-page":"390","DOI":"10.1063\/1.4823313","volume":"8","author":"P Ginsparg","year":"1994","unstructured":"Ginsparg, P.: First steps towards electronic research communication. Comput. Phys. 8(4), 390\u2013396 (1994). https:\/\/doi.org\/10.1063\/1.4823313","journal-title":"Comput. Phys."},{"issue":"7359","key":"5_CR19","doi-asserted-by":"publisher","first-page":"145","DOI":"10.1038\/476145a","volume":"476","author":"P Ginsparg","year":"2011","unstructured":"Ginsparg, P.: ArXiv at 20. Nature 476(7359), 145\u2013147 (2011). https:\/\/doi.org\/10.1038\/476145a","journal-title":"Nature"},{"key":"5_CR20","unstructured":"Google Scholar: Google scholar. https:\/\/scholar.google.com\/. Accessed 22 May 2023"},{"key":"5_CR21","doi-asserted-by":"publisher","unstructured":"Hails, A.J., Day, A.R.: The SAGE rejected article tracker. J. Open Source Softw. 6(64), 3348 (2021). https:\/\/doi.org\/10.21105\/joss.03348","DOI":"10.21105\/joss.03348"},{"key":"5_CR22","unstructured":"Humanities Commons: Humanities Commons. https:\/\/hcommons.org\/. Accessed 22 May 2023"},{"key":"5_CR23","doi-asserted-by":"publisher","unstructured":"Jaccard, P.: The distribution of the flora in the alpine zone.1. New Phytologist 11(2), 37\u201350 (1912). https:\/\/doi.org\/10.1111\/j.1469-8137.1912.tb05611.x","DOI":"10.1111\/j.1469-8137.1912.tb05611.x"},{"issue":"1","key":"5_CR24","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1145\/3274784.3274787","volume":"52","author":"D Kelly","year":"2018","unstructured":"Kelly, D.: SIGIR community survey on preprint services. SIGIR Forum 52(1), 11\u201333 (2018). https:\/\/doi.org\/10.1145\/3274784.3274787","journal-title":"SIGIR Forum"},{"key":"5_CR25","unstructured":"Kinney, R.M., et al.: The semantic scholar open data platform. Preprint (2023). arXiv: 2301.10140v1 [cs.DL]"},{"key":"5_CR26","doi-asserted-by":"publisher","unstructured":"Larivi\u00e8re, V., Sugimoto, C.R., Macaluso, B., Milojevi\u0107, S., Cronin, B., Thelwall, M.: $${\\rm ArXiv}$$ e-prints and the journal of record: an analysis of roles and relationships. Journal of the Association for Information Science and Technology 65(6), 1157\u20131169 (2014). https:\/\/doi.org\/10.1002\/asi.23044","DOI":"10.1002\/asi.23044"},{"key":"5_CR27","first-page":"707","volume":"10","author":"VI Levenshtein","year":"1966","unstructured":"Levenshtein, V.I.: Binary codes capable of correcting deletions, insertions and reversals. Soviet Phys. Doklady 10, 707\u2013710 (1966)","journal-title":"Soviet Phys. Doklady"},{"key":"5_CR28","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/3-540-45735-6_1","volume-title":"String Processing and Information Retrieval","author":"M Ley","year":"2002","unstructured":"Ley, M.: The DBLP computer science bibliography: evolution, research issues, perspectives. In: Laender, A.H.F., Oliveira, A.L. (eds.) SPIRE 2002. LNCS, vol. 2476, pp. 1\u201310. Springer, Heidelberg (2002). https:\/\/doi.org\/10.1007\/3-540-45735-6_1"},{"key":"5_CR29","doi-asserted-by":"publisher","unstructured":"Lin, J., Yu, Y., Zhou, Y., Zhou, Z., Shi, X.: How many preprints have actually been printed and why: a case study of computer science preprints on $${\\rm arXiv.}$$ Scientometrics 124(1), 555\u2013574 (2020). https:\/\/doi.org\/10.1007\/s11192-020-03430-8","DOI":"10.1007\/s11192-020-03430-8"},{"issue":"11","key":"5_CR30","doi-asserted-by":"publisher","first-page":"1776","DOI":"10.1002\/asi.20888","volume":"59","author":"C Lis\u00e9e","year":"2008","unstructured":"Lis\u00e9e, C., Larivi\u00e8re, V., Archambault, E.: Conference proceedings as a source of scientific information: a bibliometric analysis. J. Am. Soc. Inform. Sci. Technol. 59(11), 1776\u20131784 (2008). https:\/\/doi.org\/10.1002\/asi.20888","journal-title":"J. Am. Soc. Inform. Sci. Technol."},{"key":"5_CR31","doi-asserted-by":"publisher","unstructured":"Lo, K., Wang, L.L., Neumann, M.E., Kinney, R.M., Weld, D.S.: S2ORC: the semantic scholar open research corpus. In: Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, pp. 4969\u20134983 (2020). https:\/\/doi.org\/10.18653\/v1\/2020.acl-main.447","DOI":"10.18653\/v1\/2020.acl-main.447"},{"key":"5_CR32","doi-asserted-by":"publisher","unstructured":"Moskovic, M.: The INSPIRE REST API. API documentation (2021). https:\/\/doi.org\/10.5281\/zenodo.5788550. https:\/\/github.com\/inspirehep\/rest-api-doc","DOI":"10.5281\/zenodo.5788550"},{"key":"5_CR33","unstructured":"Priem, J., Piwowar, H.A., Orr, R.: OpenAlex: A fully-open index of scholarly works, authors, venues, institutions, and concepts. Preprint (2022), arXiv: 2205.01833v2 [cs.DL]"},{"issue":"1","key":"5_CR34","doi-asserted-by":"publisher","first-page":"13","DOI":"10.6087\/kcse.2014.1.13","volume":"1","author":"L Rachael","year":"2014","unstructured":"Rachael, L.: CrossRef developments and initiatives: an update on services for the scholarly publishing community from CrossRef. Science Editing 1(1), 13\u201318 (2014). https:\/\/doi.org\/10.6087\/kcse.2014.1.13","journal-title":"Science Editing"},{"key":"5_CR35","doi-asserted-by":"publisher","unstructured":"Rawlinson, C., Bloom, T.: New preprint server for medical research. BMJ 365 (2019). https:\/\/doi.org\/10.1136\/bmj.l2301","DOI":"10.1136\/bmj.l2301"},{"issue":"4","key":"5_CR36","doi-asserted-by":"publisher","first-page":"402","DOI":"10.1001\/jama.2017.21168","volume":"319","author":"S Serghiou","year":"2018","unstructured":"Serghiou, S., Ioannidis, J.P.A.: Altmetric scores, citations, and publication of studies posted as preprints. JAMA 319(4), 402\u2013404 (2018). https:\/\/doi.org\/10.1001\/jama.2017.21168","journal-title":"JAMA"},{"key":"5_CR37","doi-asserted-by":"publisher","unstructured":"Sever, R., Roeder, T., Hindle, S., Sussman, L., Black, K.J., Argentine, J., Manos, W., Inglis, J.R.: bioRxiv: the preprint server for biology. Preprint (2019). https:\/\/doi.org\/10.1101\/833400","DOI":"10.1101\/833400"},{"key":"5_CR38","unstructured":"Sutton, C., Gong, L.: Popularity of arXiv$${.}$$org within computer science. Preprint (2017), arXiv: 1710.05225v1 [cs.DL]"}],"container-title":["Lecture Notes in Computer Science","Linking Theory and Practice of Digital Libraries"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-43849-3_5","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,13]],"date-time":"2024-03-13T15:44:58Z","timestamp":1710344698000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-43849-3_5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"ISBN":["9783031438486","9783031438493"],"references-count":38,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-43849-3_5","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2023]]},"assertion":[{"value":"22 September 2023","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"TPDL","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Theory and Practice of Digital Libraries","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Zadar","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Croatia","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2023","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26 September 2023","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2023","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"tpdl2023","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/tpdl2023.dei.unipd.it\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Single-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Microsoft CMT","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"69","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"13","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"17","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"19% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"2","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3 invited papers","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}