{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,20]],"date-time":"2025-10-20T17:47:27Z","timestamp":1760982447913},"reference-count":32,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2007,12,20]],"date-time":"2007-12-20T00:00:00Z","timestamp":1198108800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2007,12,20]],"date-time":"2007-12-20T00:00:00Z","timestamp":1198108800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Inf Retrieval"],"published-print":{"date-parts":[[2008,4]]},"DOI":"10.1007\/s10791-007-9040-x","type":"journal-article","created":{"date-parts":[[2007,12,19]],"date-time":"2007-12-19T15:08:59Z","timestamp":1198076939000},"page":"109-138","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":33,"title":["An analysis on document length retrieval trends in language modeling smoothing"],"prefix":"10.1007","volume":"11","author":[{"given":"David E.","family":"Losada","sequence":"first","affiliation":[]},{"given":"Leif","family":"Azzopardi","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2007,12,20]]},"reference":[{"key":"9040_CR1","doi-asserted-by":"crossref","unstructured":"Allan, J. (2005). HARD track overview in TREC 2005 high accuracy retrieval from documents. In Proceedings of the 14th Text Retrieval Conference (TREC 2005).","DOI":"10.21236\/ADA439446"},{"key":"9040_CR2","unstructured":"Amati, G. (2003). Divergence from randomness. Ph.D. thesis, Department of Computer Science, University of Glasgow."},{"issue":"4","key":"9040_CR3","doi-asserted-by":"publisher","first-page":"357","DOI":"10.1145\/582415.582416","volume":"20","author":"G. Amati","year":"2002","unstructured":"Amati, G., & van Rijsbergen, C. (2002). Probabilistic models of information retrieval based on measuring the divergence from randomness. ACM Transactions on Information Systems (TOIS), 20(4), 357\u2013389.","journal-title":"ACM Transactions on Information Systems (TOIS)"},{"key":"9040_CR4","unstructured":"Azzopardi, L. (2005) Incorporating context into the language modeling for ad hoc information retrieval. Ph.D. thesis, University of Paisley, Glasgow, UK."},{"key":"9040_CR5","unstructured":"Azzopardi, L., & Losada, D. E. (2007). Fairly retrieving documents of all lengths. In Proceedings of the First International Conference in Theory of Information Retrieval (ICTIR 2007) (pp. 65\u201376)."},{"key":"9040_CR6","unstructured":"Chen, S. F., & Goodman, J. (1998). An empirical study of smoothing techniques for language modeling. Technical report TR-10-98, Harvard University."},{"key":"9040_CR7","doi-asserted-by":"crossref","unstructured":"Chowdhury, A., McCabe, M. C., Grossman, D., & Frieder, O. (2002). Document normalization revisited. In Proceedings of the 25th ACM SIGIR Conference on Research and Development in Information Retrieval (pp. 381\u2013382). New York, NY: ACM Press.","DOI":"10.1145\/564376.564454"},{"key":"9040_CR8","doi-asserted-by":"crossref","unstructured":"Craswell, N., Robertson, S., Zaragoza, H., & Taylor, M. (2005). Relevance weighting for query independent evidence. In Proceedings of the 28th ACM Conference on Research and Development in Information Retrieval, SIGIR\u201905 (pp. 416\u2013423). Salvador, Brazil.","DOI":"10.1145\/1076034.1076106"},{"key":"9040_CR9","unstructured":"Harman, D. (2005). TREC: Experiment and Evaluation in Information Retrieval, Chap. The TREC AdHoc Experiments, pp. 79\u201397. The MIT Press."},{"key":"9040_CR10","doi-asserted-by":"crossref","unstructured":"Hauff, C., & Azzopardi, L. (2005). Age dependent document priors in link structure analysis. In D. Losada & J. M. Fernandez-Luna (Eds.), Proceedings of the 27th European Conference on Information Retrieval Research, ECIR\u20192005 (pp. 552\u2013554). Santiago de Compostela, Spain: Springer Verlag, LNCS 3408.","DOI":"10.1007\/978-3-540-31865-1_48"},{"key":"9040_CR11","doi-asserted-by":"crossref","unstructured":"Hiemstra, D. (1998). A linguistically motivated probabilistic model of information retrieval. In C. Nicolaou & C. Stephanidis (Eds.), Lecture Notes in Computer Science: Research and Advanced Technology for Digital Libraries, Vol. 1513 (pp. 569\u2013584).","DOI":"10.1007\/3-540-49653-X_34"},{"key":"9040_CR12","doi-asserted-by":"publisher","first-page":"131","DOI":"10.1007\/s007999900025","volume":"3","author":"D. Hiemstra","year":"2000","unstructured":"Hiemstra, D. (2000). A probabilistic justification for using tf x idf term weighting in information retrieval. International Journal of Digital Libraries, 3, 131\u2013139.","journal-title":"International Journal of Digital Libraries"},{"key":"9040_CR13","unstructured":"Jelinek, F., & Mercer, R. (1980). Interpolated estimation of Markov source parameters from sparse data. In Proceedings of the Workshop on Pattern Recognition in Practice. Amsterdam."},{"key":"9040_CR14","doi-asserted-by":"crossref","unstructured":"Kamps, J. (2005). Web-centric language models. In Proceedings of the ACM Conference on Information and Knowledge Management (CIKM).","DOI":"10.1145\/1099554.1099640"},{"key":"9040_CR15","unstructured":"Kraaij, W., & Westerveld, T. (2000). TNO\/UT at TREC-9: How different are web documents. In Proceedings of the TREC-9, the 9th Text Retrieval Conference. Gaithersburg, USA."},{"key":"9040_CR16","doi-asserted-by":"crossref","unstructured":"Kraaij, W., Westerveld, T., & Hiemstra, D. (2002). The importance of prior probabilities for entry page search. In Proceedings of the 25th ACM Conference on Research and Development in Information Retrieval, SIGIR\u201902 (pp. 27\u201334). Tampere, Finland.","DOI":"10.1145\/564376.564383"},{"key":"9040_CR17","unstructured":"Lemur. (2002). The Lemur toolkit. http:\/\/www.lemurproject.org"},{"issue":"3","key":"9040_CR18","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1017\/S1351324900000218","volume":"1","author":"D. Mackay","year":"1995","unstructured":"Mackay, D., & Peto, L. (1995). A hierarchical Dirichlet language model. Natural Language Engineering, 1(3), 1\u201319.","journal-title":"Natural Language Engineering"},{"key":"9040_CR19","unstructured":"Manning, C. D., & Sch\u00fctze, H. (1999). Foundations of statistical natural language processing. The MIT Press."},{"key":"9040_CR20","doi-asserted-by":"crossref","unstructured":"Miller, D., Leek, T., & Schwartz, R. (1999). A hidden markov movel information retrieval system. In Proceedings of the SIGIR-99, the 22nd ACM Conference on Research and Development in Information Retrieval (pp. 214\u2013221). Berkeley.","DOI":"10.1145\/312624.312680"},{"key":"9040_CR21","unstructured":"Ogilvie, P., & Callan, J. (2004). Experiments with language models for known-item finding of e-mail messages. In Proceedings of the 14th Text Retrieval Conference, TREC-2004."},{"key":"9040_CR22","doi-asserted-by":"crossref","unstructured":"Ponte, J., & Croft, W. B. (1998). A language modeling approach to information retrieval. In Proceedings of the 21st ACM Conference on Research and Development in Information Retrieval, SIGIR\u201998 (pp. 275\u2013281). Melbourne, Australia.","DOI":"10.1145\/290941.291008"},{"issue":"3","key":"9040_CR23","doi-asserted-by":"crossref","first-page":"130","DOI":"10.1108\/eb046814","volume":"14","author":"M. Porter","year":"1980","unstructured":"Porter, M. (1980). An algorithm for suffix stripping. Program, 14(3), 130\u2013137.","journal-title":"Program"},{"key":"9040_CR24","doi-asserted-by":"crossref","unstructured":"Robertson, S., & Walker, S. (1994). Some simple effective approximations to the 2-poisson model for probabilistic weighted retrieval. In Proceedings of the SIGIR-94, the 17th ACM Conference on Research and Development in Information Retrieval (pp. 232\u2013241). Dublin, Ireland.","DOI":"10.1007\/978-1-4471-2099-5_24"},{"key":"9040_CR25","unstructured":"Robertson, S., Walker, S., Jones, S., Hancock Beaulieu, M., & Gatford, M. (1995). Okapi at TREC-3. In Harman, D. (Ed.), Proceedings of the TREC-3, the 3rd Text Retrieval Conference (pp. 109\u2013127). NIST."},{"key":"9040_CR26","doi-asserted-by":"crossref","unstructured":"Sanderson, M., & Zobel, J. (2005). Information retrieval system evaluation: Effort, sensitivity, and reliability. In Proceedings  of the 28th ACM SIGIR Conference on Research and Development in Information Retrieval (pp. 162\u2013169).","DOI":"10.1145\/1076034.1076064"},{"key":"9040_CR27","doi-asserted-by":"crossref","unstructured":"Singhal, A., Buckley, C., & Mitra, M. (1996a). Pivoted document length normalization. In Proceedings of the 19th ACM SIGIR conference on Research and Development in Information Retrieval (pp. 21\u201329).","DOI":"10.1145\/243199.243206"},{"key":"9040_CR28","doi-asserted-by":"crossref","unstructured":"Singhal, A., Buckley, C., & Mitra, M. (1996b). Pivoted document length normalization. In Proceedings of the SIGIR-96, the 19th ACM Conference on Research and Development in Information Retrieval (pp. 21\u201329). Zurich, Switzerland.","DOI":"10.1145\/243199.243206"},{"key":"9040_CR29","doi-asserted-by":"crossref","unstructured":"Voorhees, E., & Harman, D. (1999). Overview of the eight text retrieval conference. In Proceedings of the TREC-8, the 8th text retrieval conference.","DOI":"10.6028\/NIST.SP.500-246"},{"key":"9040_CR30","doi-asserted-by":"crossref","unstructured":"Zhai, C., & Lafferty, J. (2001). A study of smoothing methods for language models applied to adhoc information retrieval. In Proceedings of the 24th ACM Conference on Research and Development in Information Retrieval, SIGIR\u201901 (pp. 334\u2013342). New Orleans, USA.","DOI":"10.1145\/383952.384019"},{"key":"9040_CR31","doi-asserted-by":"crossref","unstructured":"Zhai, C., & Lafferty, J. (2002). Two-stage language models for information retrieval. In Proceedings of the 25th ACM Conference on Research and Development in Information Retrieval, SIGIR\u201902 (pp. 49\u201356). Tampere, Finland.","DOI":"10.1145\/564376.564387"},{"issue":"2","key":"9040_CR32","doi-asserted-by":"publisher","first-page":"179","DOI":"10.1145\/984321.984322","volume":"22","author":"C. Zhai","year":"2004","unstructured":"Zhai, C., & Lafferty, J. (2004). A study of smoothing methods for language models applied to information retrieval. ACM Transactions on Information Systems, 22(2), 179\u2013214.","journal-title":"ACM Transactions on Information Systems"}],"container-title":["Information Retrieval"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10791-007-9040-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10791-007-9040-x\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10791-007-9040-x","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10791-007-9040-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,2]],"date-time":"2024-01-02T14:32:30Z","timestamp":1704205950000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10791-007-9040-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2007,12,20]]},"references-count":32,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2008,4]]}},"alternative-id":["9040"],"URL":"https:\/\/doi.org\/10.1007\/s10791-007-9040-x","relation":{},"ISSN":["1386-4564","1573-7659"],"issn-type":[{"value":"1386-4564","type":"print"},{"value":"1573-7659","type":"electronic"}],"subject":[],"published":{"date-parts":[[2007,12,20]]},"assertion":[{"value":"24 July 2007","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 December 2007","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 December 2007","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}