{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,18]],"date-time":"2025-12-18T19:35:54Z","timestamp":1766086554043,"version":"3.37.0"},"publisher-location":"Berlin, Heidelberg","reference-count":28,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642041730"},{"type":"electronic","value":"9783642041747"}],"license":[{"start":{"date-parts":[[2009,1,1]],"date-time":"2009-01-01T00:00:00Z","timestamp":1230768000000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2009]]},"DOI":"10.1007\/978-3-642-04174-7_23","type":"book-chapter","created":{"date-parts":[[2009,8,27]],"date-time":"2009-08-27T00:52:46Z","timestamp":1251334366000},"page":"350-365","source":"Crossref","is-referenced-by-count":6,"title":["Identifying the Original Contribution of a Document via Language Modeling"],"prefix":"10.1007","author":[{"given":"Benyah","family":"Shaparenko","sequence":"first","affiliation":[]},{"given":"Thorsten","family":"Joachims","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"23_CR1","unstructured":"Mei, Q., Zhai, C.: Generating impact-based summaries for scientific literature. In: Proceedings of the Association for Computational Linguistics (ACL), pp. 816\u2013824 (2008)"},{"key":"23_CR2","doi-asserted-by":"crossref","unstructured":"Soboroff, I., Harman, D.: Overview of the TREC 2003 novelty track. In: Proceedings of the Text Retrieval Conference, TREC (2003)","DOI":"10.6028\/NIST.SP.500-255.novelty-overview"},{"key":"23_CR3","unstructured":"NIST: Document Understanding Conferences (DUC), http:\/\/duc.nist.gov\/"},{"key":"23_CR4","unstructured":"Allan, J., Carbonell, J., Doddington, G., Yamron, J., Yang, Y.: Topic detection and tracking pilot study: Final report. In: Proceedings of the DARPA Broadcast News Transcription and Understanding Workshop (1998)"},{"key":"23_CR5","doi-asserted-by":"crossref","unstructured":"Allan, J., Papka, R., Lavrenko, V.: On-line new event detection and tracking. In: Proceedings of the SIGIR Conference on Research and Development in Information Retrieval, pp. 37\u201345 (1998)","DOI":"10.1145\/290941.290954"},{"issue":"5","key":"23_CR6","first-page":"993","volume":"3","author":"D. Blei","year":"2003","unstructured":"Blei, D., Ng, A., Jordan, M.: Latent dirichlet allocation. Journal of Machine Learning Research (JMLR)\u00a03(5), 993\u20131022 (2003)","journal-title":"Journal of Machine Learning Research (JMLR)"},{"key":"23_CR7","unstructured":"Blei, D., Griffiths, T., Jordan, M., Tenenbaum, J.: Hierarchical topic models and the nested chinese restaurant process. In: Proceedings of the Conference on Advances in Neural Information Processing Systems, NIPS (2003)"},{"key":"23_CR8","unstructured":"Blei, D., Lafferty, J.: Correlated topic models. In: Proceedings of the Conference on Advances in Neural Information Processing Systems, NIPS (2005)"},{"key":"23_CR9","doi-asserted-by":"crossref","unstructured":"Blei, D.M., Lafferty, J.D.: Dynamic topic models. In: Proceedings of the International Conference on Machine Learning (ICML), pp. 113\u2013120 (2006)","DOI":"10.1145\/1143844.1143859"},{"key":"23_CR10","doi-asserted-by":"crossref","unstructured":"Hofmann, T.: Probabilistic latent semantic analysis. In: Proceedings of the Conference on Uncertainty in Artificial Inteligence, UAI (1999)","DOI":"10.1145\/312624.312649"},{"key":"23_CR11","doi-asserted-by":"crossref","unstructured":"Mann, G., Mimno, D., McCallum, A.: Bibliometric impact measures leveraging topic analysis. In: Proceedings of the Joint Conference on Digital Libraries, JCDL (2006)","DOI":"10.1145\/1141753.1141765"},{"key":"23_CR12","doi-asserted-by":"crossref","unstructured":"Wang, X., McCallum, A.: Topics over time: A non-markov continuous-time model of topical trends. In: Proceedings of the Conference on Knowledge Discovery and Data Mining (KDD), pp. 424\u2013433 (2006)","DOI":"10.1145\/1150402.1150450"},{"key":"23_CR13","doi-asserted-by":"crossref","unstructured":"Steyvers, M., Smyth, P., Rosen-Zvi, M., Griffiths, T.: Probabilistic author-topic models for information discovery. In: Proceedings of the Conference on Knowledge Discovery and Data Mining (KDD), pp. 306\u2013315 (2004)","DOI":"10.1145\/1014052.1014087"},{"key":"23_CR14","unstructured":"Griffiths, T., Steyvers, M.: A probabilistic approach to semantic representation. In: Proceedings of the Annual Conference of the Cognitive Science Society (2002)"},{"key":"23_CR15","doi-asserted-by":"crossref","unstructured":"Dietz, L., Bickel, S., Scheffer, T.: Unsupervised prediction of citation influences. In: Proceedings of the International Conference on Machine Learning (ICML), pp. 233\u2013240 (2007)","DOI":"10.1145\/1273496.1273526"},{"key":"23_CR16","unstructured":"McCallum, A., Corrada-Emanuel, A., Wang, X.: Topic and role discovery in social networks. In: Proceedings of International Joint Conference on Artificial Intelligence, IJCAI (2005)"},{"key":"23_CR17","doi-asserted-by":"crossref","unstructured":"Mei, Q., Ling, X., Wondra, M., Su, H., Zhai, C.: Topic sentiment mixture: Modeling facets and opinions in weblogs. In: Proceedings of the World Wide Web Conference (WWW), pp. 171\u2013180 (2007)","DOI":"10.1145\/1242572.1242596"},{"key":"23_CR18","doi-asserted-by":"crossref","unstructured":"Li, W., McCallum, A.: Pachinko allocation: Dag-structured mixture models of topic correlations. In: Proceedings of the International Conference on Machine Learning, ICML (2006)","DOI":"10.1145\/1143844.1143917"},{"key":"23_CR19","unstructured":"Wang, X., Li, W., McCallum, A.: A continuous-time model of topic co-occurrence trends. In: AAAI Workshop on Event Detection (2006)"},{"key":"23_CR20","unstructured":"Griffiths, T., Steyvers, M., Blei, D., Tenenbaum, J.: Integrating topics and syntax. In: Proceedings of the Conference on Advances in Neural Information Processing Systems, NIPS (2004)"},{"key":"23_CR21","doi-asserted-by":"crossref","unstructured":"Shaparenko, B., Joachims, T.: Information genealogy: Uncovering the flow of ideas in non-hyperlinked document databases. In: Proceedings of the Conference on Knowledge Discovery and Data Mining (KDD), pp. 619\u2013628 (2007)","DOI":"10.1145\/1281192.1281259"},{"key":"23_CR22","volume-title":"Foundations of Statistical Natural Language Processing","author":"C.D. Manning","year":"1999","unstructured":"Manning, C.D., Schuetze, H.: Foundations of Statistical Natural Language Processing. MIT Press, Cambridge (1999)"},{"key":"23_CR23","first-page":"57","volume-title":"Statistical Methods for Speech Recognition","author":"F. Jelinek","year":"1998","unstructured":"Jelinek, F.: Basic Language Modeling. In: Statistical Methods for Speech Recognition, pp. 57\u201378. MIT Press, Cambridge (1998)"},{"key":"23_CR24","doi-asserted-by":"crossref","unstructured":"Zhai, C.: Risk Minimization and Language Modeling in Information Retrieval. PhD thesis, Carnegie Mellon University (2002)","DOI":"10.1145\/792550.792571"},{"key":"23_CR25","doi-asserted-by":"crossref","unstructured":"Kurland, O., Lee, L.: Corpus structure, language models, and ad hoc information retrieval. In: Proceedings of the SIGIR Conference on Research and Development in Information Retrieval, pp. 194\u2013201 (2004)","DOI":"10.1145\/1008992.1009027"},{"key":"23_CR26","doi-asserted-by":"crossref","unstructured":"Kurland, O., Lee, L.: Respect my authority! hits without hyperlinks, utilizing cluster-based language models. In: Proceedings of the SIGIR Conference on Research and Development in Information Retrieval, pp. 83\u201390 (2006)","DOI":"10.1145\/1148170.1148188"},{"key":"23_CR27","unstructured":"MOSEK: http:\/\/www.mosek.com\/index.html"},{"key":"23_CR28","unstructured":"NIPS Online: The Text Repository, http:\/\/nips.djvuzone.org\/txt.html"}],"container-title":["Lecture Notes in Computer Science","Machine Learning and Knowledge Discovery in Databases"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-04174-7_23","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,2,11]],"date-time":"2025-02-11T21:46:53Z","timestamp":1739310413000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-04174-7_23"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009]]},"ISBN":["9783642041730","9783642041747"],"references-count":28,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-04174-7_23","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2009]]}}}