{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,31]],"date-time":"2025-10-31T22:06:26Z","timestamp":1761948386303,"version":"3.37.3"},"reference-count":25,"publisher":"Springer Science and Business Media LLC","issue":"6","license":[{"start":{"date-parts":[[2018,6,30]],"date-time":"2018-06-30T00:00:00Z","timestamp":1530316800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0"}],"funder":[{"DOI":"10.13039\/501100002428","name":"Austrian Science Fund","doi-asserted-by":"publisher","award":["P25905-N23 (ADmIRE)"],"award-info":[{"award-number":["P25905-N23 (ADmIRE)"]}],"id":[{"id":"10.13039\/501100002428","id-type":"DOI","asserted-by":"publisher"}]},{"name":"EU-ROSTARS","award":["FFG 852624 (Self-Optimizer)"],"award-info":[{"award-number":["FFG 852624 (Self-Optimizer)"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Inf Retrieval J"],"published-print":{"date-parts":[[2018,12]]},"DOI":"10.1007\/s10791-018-9334-1","type":"journal-article","created":{"date-parts":[[2018,6,30]],"date-time":"2018-06-30T02:08:23Z","timestamp":1530324503000},"page":"565-596","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["A systematic approach to normalization in probabilistic models"],"prefix":"10.1007","volume":"21","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3643-6493","authenticated-orcid":false,"given":"Aldo","family":"Lipani","sequence":"first","affiliation":[]},{"given":"Thomas","family":"Roelleke","sequence":"additional","affiliation":[]},{"given":"Mihai","family":"Lupu","sequence":"additional","affiliation":[]},{"given":"Allan","family":"Hanbury","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,6,30]]},"reference":[{"key":"9334_CR1","unstructured":"Amati, G., & Kerpedjiev, S. (1992). An information retrieval logic model: Implementation and experiments. Tech. Rep. REL 5b04892, Fondazione Ugo Bordoni, Rome, Italy."},{"issue":"4","key":"9334_CR2","doi-asserted-by":"publisher","first-page":"357","DOI":"10.1145\/582415.582416","volume":"20","author":"G Amati","year":"2002","unstructured":"Amati, G., & Van Rijsbergen, C. J. (2002). Probabilistic models of information retrieval based on measuring the divergence from randomness. ACM Transactions on Information Systems, 20(4), 357\u2013389. \n                    https:\/\/doi.org\/10.1145\/582415.582416\n                    \n                  .","journal-title":"ACM Transactions on Information Systems"},{"key":"9334_CR3","doi-asserted-by":"publisher","first-page":"283","DOI":"10.1007\/978-94-017-2390-9_18","volume-title":"Text, Speech and Language Technology","author":"K. Church","year":"1999","unstructured":"Church, K., & Gale, W. (1999). Inverse document frequency (IDF): A measure of deviations from poisson (pp. 283\u2013295). Dordrecht: Springer. \n                    https:\/\/doi.org\/10.1007\/978-94-017-2390-9_18\n                    \n                  ."},{"key":"9334_CR4","doi-asserted-by":"publisher","unstructured":"Fang, H., Tao, T., & Zhai, C. (2004). A formal study of information retrieval heuristics. In Proceedings of the 27th annual international ACM SIGIR conference on research and development in information retrieval, SIGIR \u201904 (pp. 49\u201356). New York, NY, USA: ACM. \n                    https:\/\/doi.org\/10.1145\/1008992.1009004\n                    \n                  .","DOI":"10.1145\/1008992.1009004"},{"key":"9334_CR5","unstructured":"Hanbury, A., & Lupu, M. (2013). Toward a model of domain-specific search. In Proceedings of the 10th conference on open research areas in information retrieval, OAIR \u201913 (pp. 33\u201336). Paris, France: CID."},{"key":"9334_CR6","doi-asserted-by":"publisher","unstructured":"HE, B., & Ounis, I. (2003). A study of parameter tuning for term frequency normalization. In Proceedings of the twelfth international conference on information and knowledge management, CIKM \u201903 (pp. 10\u201316). New York, NY, USA: ACM. \n                    https:\/\/doi.org\/10.1145\/956863.956867\n                    \n                  .","DOI":"10.1145\/956863.956867"},{"key":"9334_CR7","doi-asserted-by":"publisher","unstructured":"He, B., & Ounis, I. (2005a). A study of the dirichlet priors for term frequency normalisation. In Proceedings of the 28th annual international ACM SIGIR conference on research and development in information retrieval, SIGIR \u201905 (pp. 465\u2013471). New York, NY, USA: ACM. \n                    https:\/\/doi.org\/10.1145\/1076034.1076114\n                    \n                  .","DOI":"10.1145\/1076034.1076114"},{"key":"9334_CR8","doi-asserted-by":"publisher","first-page":"200","DOI":"10.1007\/978-3-540-31865-1_15","volume-title":"Lecture Notes in Computer Science","author":"Ben He","year":"2005","unstructured":"He, B., & Ounis, I. (2005b). Term frequency normalisation tuning for BM25 and DFR models (pp. 200\u2013214). Heidelberg, Berlin: Springer. \n                    https:\/\/doi.org\/10.1007\/978-3-540-31865-1_15\n                    \n                  ."},{"key":"9334_CR9","unstructured":"Knaus, D., Mittendorf, E., & Schauble, P. (1994). Improving a basic retrieval method by links and passage level evidence. In Proceedings of the 3rd text REtrieval conference (pp. 241\u2013241)."},{"key":"9334_CR10","doi-asserted-by":"publisher","unstructured":"Lipani, A., Lupu, M., Hanbury, A., & Aizawa, A. (2015). Verboseness fission for bm25 document length normalization. In Proceedings of the 2015 international conference on the theory of information retrieval, ICTIR \u201915 (pp. 385\u2013388). New York, NY, USA: ACM. \n                    https:\/\/doi.org\/10.1145\/2808194.2809486\n                    \n                  .","DOI":"10.1145\/2808194.2809486"},{"key":"9334_CR11","doi-asserted-by":"publisher","unstructured":"Lv, Y., & Zhai, C. (2011a). Adaptive term frequency normalization for bm25. In Proceedings of the 20th ACM International Conference on Information and Knowledge Management, CIKM \u201911 (pp. 1985\u20131988). New York, NY, USA: ACM. \n                    https:\/\/doi.org\/10.1145\/2063576.2063871\n                    \n                  .","DOI":"10.1145\/2063576.2063871"},{"key":"9334_CR12","doi-asserted-by":"publisher","unstructured":"Lv, Y., & Zhai, C. (2011b). Lower-bounding term frequency normalization. In Proceedings of the 20th ACM international conference on information and knowledge management, CIKM \u201911 (pp. 7\u201316). New York, NY, USA: ACM. \n                    https:\/\/doi.org\/10.1145\/2063576.2063584\n                    \n                  .","DOI":"10.1145\/2063576.2063584"},{"key":"9334_CR13","doi-asserted-by":"publisher","unstructured":"Lv, Y., & Zhai, C. (2011c). When documents are very long, bm25 fails! In Proceedings of the 34th international ACM SIGIR conference on research and development in information retrieval, SIGIR \u201911 (pp. 1103\u20131104). New York, NY, USA: ACM. \n                    https:\/\/doi.org\/10.1145\/2009916.2010070\n                    \n                  .","DOI":"10.1145\/2009916.2010070"},{"key":"9334_CR14","doi-asserted-by":"publisher","unstructured":"Metzler, D. (2008). Generalized inverse document frequency. In Proceedings of the 17th ACM conference on information and knowledge management, CIKM \u201908 (pp. 399\u2013408). New York, NY, USA: ACM. \n                    https:\/\/doi.org\/10.1145\/1458082.1458137\n                    \n                  . \n                    http:\/\/doi.acm.org\/10.1145\/1458082.1458137\n                    \n                  .","DOI":"10.1145\/1458082.1458137"},{"key":"9334_CR15","doi-asserted-by":"publisher","unstructured":"Na, S. H., Kang, I. S., & Lee, J. H. (2008). Improving term frequency normalization for multi-topical documents and application to language modeling approaches (pp. 382\u2013393). Berlin, Heidelberg: Springer. \n                    https:\/\/doi.org\/10.1007\/978-3-540-78646-7_35\n                    \n                  .","DOI":"10.1007\/978-3-540-78646-7_35"},{"key":"9334_CR17","unstructured":"Robertson, S. E., & Walker, S. (1999). Okapi\/keenbow at TREC-8. In Proceedings of the 8th text REtrieval conference (Vol.\u00a08, pp. 151\u2013162)."},{"key":"9334_CR18","unstructured":"Robertson, S. E., Walker, S., Jones, S., Hancock-Beaulieu, M., & Gatford, M. (1994). Okapi at TREC-3. In Proceedings of the 3rd text REtrieval conference (Vol.\u00a03, pp. 109\u2013126)."},{"issue":"4","key":"9334_CR16","doi-asserted-by":"publisher","first-page":"333","DOI":"10.1561\/1500000019","volume":"3","author":"S Robertson","year":"2009","unstructured":"Robertson, S., & Zaragoza, H. (2009). The probabilistic relevance framework: Bm25 and beyond. Foundations and Trends\u00aein. Information Retrieval, 3(4), 333\u2013389. \n                    https:\/\/doi.org\/10.1561\/1500000019\n                    \n                  .","journal-title":"Information Retrieval"},{"issue":"3","key":"9334_CR19","doi-asserted-by":"publisher","first-page":"1","DOI":"10.2200\/S00494ED1V01Y201304ICR027","volume":"5","author":"Thomas Roelleke","year":"2013","unstructured":"Roelleke, T. (2013). Information retrieval models: Foundations and relationships. \n                    https:\/\/doi.org\/10.2200\/S00494ED1V01Y201304ICR027\n                    \n                  .","journal-title":"Synthesis Lectures on Information Concepts, Retrieval, and Services"},{"issue":"11","key":"9334_CR20","doi-asserted-by":"publisher","first-page":"2982","DOI":"10.1093\/comjnl\/bxv031","volume":"58","author":"T Roelleke","year":"2015","unstructured":"Roelleke, T., Kaltenbrunner, A., & Baeza-Yates, R. (2015). Harmony assumptions in information retrieval and social networks. The Computer Journal, 58(11), 2982. \n                    https:\/\/doi.org\/10.1093\/comjnl\/bxv031\n                    \n                  .","journal-title":"The Computer Journal"},{"key":"9334_CR21","doi-asserted-by":"publisher","unstructured":"Roelleke, T., & Wang, J. (2008). Tf-idf uncovered: A study of theories and probabilities. In Proceedings of the 31st annual international ACM SIGIR conference on research and development in information retrieval, SIGIR \u201908 (pp. 435\u2013442). New York, NY, USA: ACM. \n                    https:\/\/doi.org\/10.1145\/1390334.1390409\n                    \n                  .","DOI":"10.1145\/1390334.1390409"},{"key":"9334_CR22","doi-asserted-by":"publisher","unstructured":"Rousseau, F., & Vazirgiannis, M. (2013). Composition of tf normalizations: New insights on scoring functions for ad hoc ir. In Proceedings of the 36th international ACM SIGIR conference on research and development in information retrieval, SIGIR \u201913 (pp. 917\u2013920). New York, NY, USA: ACM. \n                    https:\/\/doi.org\/10.1145\/2484028.2484121\n                    \n                  .","DOI":"10.1145\/2484028.2484121"},{"issue":"5","key":"9334_CR23","doi-asserted-by":"publisher","first-page":"513","DOI":"10.1016\/0306-4573(88)90021-0","volume":"24","author":"Gerard Salton","year":"1988","unstructured":"Salton, G., & Buckley, C. (1988). Term-weighting approaches in automatic text retrieval. Information Processing & Management, 24(5), 513\u2013523. \n                    https:\/\/doi.org\/10.1016\/0306-4573(88)90021-0\n                    \n                  .","journal-title":"Information Processing & Management"},{"key":"9334_CR24","doi-asserted-by":"publisher","unstructured":"Singhal, A., Buckley, C., & Mitra, M. (1996). Pivoted document length normalization. In Proceedings of the 19th annual international ACM SIGIR conference on research and development in information retrieval, SIGIR \u201996 (pp. 21\u201329). New York, NY, USA: ACM. \n                    https:\/\/doi.org\/10.1145\/243199.243206\n                    \n                  .","DOI":"10.1145\/243199.243206"},{"key":"9334_CR25","doi-asserted-by":"publisher","unstructured":"Zhai, C., & Lafferty, J. (2001). A study of smoothing methods for language models applied to ad hoc information retrieval. In Proceedings of the 24th annual international ACM SIGIR conference on research and development in information retrieval, SIGIR \u201901 (pp. 334\u2013342). New York, NY, USA: ACM. \n                    https:\/\/doi.org\/10.1145\/383952.384019\n                    \n                  .","DOI":"10.1145\/383952.384019"}],"container-title":["Information Retrieval Journal"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10791-018-9334-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10791-018-9334-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10791-018-9334-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,9,22]],"date-time":"2019-09-22T04:42:47Z","timestamp":1569127367000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10791-018-9334-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,6,30]]},"references-count":25,"journal-issue":{"issue":"6","published-print":{"date-parts":[[2018,12]]}},"alternative-id":["9334"],"URL":"https:\/\/doi.org\/10.1007\/s10791-018-9334-1","relation":{},"ISSN":["1386-4564","1573-7659"],"issn-type":[{"type":"print","value":"1386-4564"},{"type":"electronic","value":"1573-7659"}],"subject":[],"published":{"date-parts":[[2018,6,30]]},"assertion":[{"value":"19 June 2017","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 June 2018","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 June 2018","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}