{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,20]],"date-time":"2025-10-20T18:09:07Z","timestamp":1760983747435},"reference-count":37,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2010,10,7]],"date-time":"2010-10-07T00:00:00Z","timestamp":1286409600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2010,10,7]],"date-time":"2010-10-07T00:00:00Z","timestamp":1286409600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Inf Retrieval"],"published-print":{"date-parts":[[2011,8]]},"DOI":"10.1007\/s10791-010-9147-3","type":"journal-article","created":{"date-parts":[[2010,10,6]],"date-time":"2010-10-06T12:16:01Z","timestamp":1286367361000},"page":"390-412","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":5,"title":["A multi-collection latent topic model for federated search"],"prefix":"10.1007","volume":"14","author":[{"given":"Mark","family":"Baillie","sequence":"first","affiliation":[]},{"given":"Mark","family":"Carman","sequence":"additional","affiliation":[]},{"given":"Fabio","family":"Crestani","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2010,10,7]]},"reference":[{"key":"9147_CR1","unstructured":"Asuncion, A., Smyth, P., & Welling, M. (2008). Asynchronous distributed learning of topic models. In  Neural information processing systems (NIPS\u201908) (pp. 81\u201388). Cambridge: MIT Press."},{"issue":"3","key":"9147_CR2","doi-asserted-by":"publisher","first-page":"347","DOI":"10.1002\/asi.20283","volume":"57","author":"T. T Avrahami","year":"2006","unstructured":"Avrahami, T. T, Yau, L., Si, L., & Callan, J. (2006). The fedlemur project: Federated search in the real world. Journal of the American Society for Information Science and Technology 57(3), 347\u2013358.","journal-title":"Journal of the American Society for Information Science and Technology"},{"issue":"2","key":"9147_CR3","doi-asserted-by":"publisher","first-page":"46","DOI":"10.1145\/1480506.1480515","volume":"42","author":"K. Balog","year":"2008","unstructured":"Balog, K. (2008). The SIGIR 2008 workshop on future challenges in expertise retrieval (fCHER). SIGIR Forum 42(2), 46\u201352.","journal-title":"SIGIR Forum"},{"key":"9147_CR4","doi-asserted-by":"crossref","unstructured":"Bar-Yossef, Z., & Gurevich, M. (2006). Random sampling from a search engine\u2019s index. In WWW\u201906: Proceedings of the 15th international conference on world wide web (pp. 367\u2013376). New York: ACM.","DOI":"10.1145\/1135777.1135833"},{"key":"9147_CR5","doi-asserted-by":"publisher","first-page":"17","DOI":"10.1214\/07-AOAS114","volume":"1","author":"D. M. Blei","year":"2007","unstructured":"Blei, D. M., & Lafferty, J. D. (2007). A correlated topic model of science. Annals of Applied \nStatistics 1, 17.","journal-title":"Annals of Applied Statistics"},{"key":"9147_CR6","doi-asserted-by":"publisher","first-page":"993","DOI":"10.1162\/jmlr.2003.3.4-5.993","volume":"3","author":"D. M. Blei","year":"2003","unstructured":"Blei, D. M., Ng, A. Y., & Jordan,  M. I. (2003). Latent dirichlet\u00a0allocation. Journal of Machine \nLearning Research 3, 993\u20131022.","journal-title":"Journal of Machine Learning Research"},{"key":"9147_CR7","doi-asserted-by":"crossref","first-page":"159","DOI":"10.1613\/jair.62","volume":"2","author":"W. L. Buntine","year":"1994","unstructured":"Buntine, W. L. (1994) Operations for learning with graphical models. Journal of Artificial \nIntelligence Research 2, 159\u2013225.","journal-title":"Journal of Artificial Intelligence Research"},{"key":"9147_CR8","doi-asserted-by":"crossref","unstructured":"Callan, J. P. (2000). Advances in information retrieval. In Distributed information retrieval (pp. 127\u2013150). Dordrecht: Kluwer Academic Publishers.","DOI":"10.1007\/0-306-47019-5_5"},{"issue":"2","key":"9147_CR9","doi-asserted-by":"publisher","first-page":"97","DOI":"10.1145\/382979.383040","volume":"19","author":"J. P. Callan","year":"2001","unstructured":"Callan, J. P., & Connell,  M. (2001). Query-based sampling of text databases. ACM Transactions \nof Information Systems 19(2), 97\u2013130.","journal-title":"ACM Transactions of Information Systems"},{"key":"9147_CR10","doi-asserted-by":"crossref","unstructured":"Callan, J. P., Lu, Z., & Croft, W. B. (1995). Searching distributed collections with inference networks. In SIGIR \u201995: Proceedings of the 18th annual international ACM SIGIR conference on research and development in information retrieval (pp. 21\u201328). New York: ACM Press.","DOI":"10.1145\/215206.215328"},{"key":"9147_CR11","unstructured":"Craswell, N., Crimmins, F., Hawking, D., & Moffat, A. (2004). Performance and cost tradeoffs in web search. In ADC\u201904: Proceedings of the 15th Australasian database conference (pp. 161\u2013169)."},{"key":"9147_CR12","doi-asserted-by":"crossref","unstructured":"Elsas, J. L., Arguello, J., Callan, J., & Carbonell, J. G. (2008). Retrieval and feedback models for blog feed search. In SIGIR \u201908: Proceedings of the 31st annual international ACM SIGIR conference on Research and development in information retrieval (pp. 347\u2013354). New York: ACM.","DOI":"10.1145\/1390334.1390394"},{"key":"9147_CR13","doi-asserted-by":"crossref","unstructured":"French, J. C., Powell, A. L., Viles, C. L., Emmitt, T., & Prey, K. J. (1998). Evaluating database selection techniques: A testbed and experiment. In SIGIR \u201998: Proceedings of the 21st annual international ACM SIGIR conference on research and development in information retrieval (pp. 121\u2013129). New York: ACM.","DOI":"10.1145\/290941.290976"},{"key":"9147_CR14","doi-asserted-by":"crossref","unstructured":"Gravano, L., Chang, C. C. K., Garcia-Molina, H., & Paepcke, A. (1997). Starts: Stanford proposal for internet meta-searching. In SIGMOD \u201997: Proceedings of the 1997 ACM SIGMOD international conference on management of data (pp. 207\u2013218). New York: ACM Press.","DOI":"10.1145\/253260.253299"},{"issue":"2","key":"9147_CR15","doi-asserted-by":"publisher","first-page":"229","DOI":"10.1145\/320248.320252","volume":"24","author":"L. Gravano","year":"1999","unstructured":"Gravano, L., Garc\u00eda-Molina, H., & Tomasic, A. (1999). GlOSS: Text-source discovery over the Internet. ACM Transactions on Database Systems 24(2), 229\u2013264.","journal-title":"ACM Transactions on Database Systems"},{"issue":"1","key":"9147_CR16","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/635484.635485","volume":"21","author":"L. Gravano","year":"2003","unstructured":"Gravano, L., Ipeirotis, P. G., & Sahami, M. (2003) Qprober: A system for automatic classification of hidden-web databases. ACM Transactions of Information Systems 21(1), 1\u201341.","journal-title":"ACM Transactions of Information Systems"},{"key":"9147_CR17","doi-asserted-by":"publisher","first-page":"5228","DOI":"10.1073\/pnas.0307752101","volume":"101","author":"T. L. Griffiths","year":"2004","unstructured":"Griffiths, T. L., & Steyvers, M. (2004). Finding scientific topics. Proceedings of the National \nAcademy of Science 101, 5228\u20135235.","journal-title":"Proceedings of the National Academy of Science"},{"key":"9147_CR18","doi-asserted-by":"crossref","unstructured":"Hawking, D., & Thomas, P. (2005). Server selection methods in hybrid portal search. In SIGIR \u201905: Proceedings of the 28th annual international ACM SIGIR conference on research and development in information retrieval (pp. 75\u201382). NY: ACM Press.","DOI":"10.1145\/1076034.1076050"},{"key":"9147_CR19","doi-asserted-by":"crossref","unstructured":"Hofmann, T. (1999). Probabilistic latent semantic indexing. In SIGIR \u201999: Proceedings of the 22nd annual international ACM SIGIR conference on research and development in information retrieval (pp. 50\u201357). NY: ACM.","DOI":"10.1145\/312624.312649"},{"issue":"2","key":"9147_CR20","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/1344411.1344412","volume":"26","author":"P. G. Ipeirotis","year":"2008","unstructured":"Ipeirotis, P. G., & Gravano, L. (2008). Classification-aware hidden-web text database selection. ACM Transactions of Information Systems 26(2), 1\u201366.","journal-title":"ACM Transactions of Information Systems"},{"key":"9147_CR21","doi-asserted-by":"crossref","unstructured":"Ipeirotis, P. G., Agichtein, E., Jain, P., & Gravano, L. (2006). To search or to crawl?: Towards a query optimizer for text-centric tasks. In SIGMOD \u201906: Proceedings of the 2006 ACM SIGMOD international conference on management of data (pp. 265\u2013276). New York: ACM Press.","DOI":"10.1145\/1142473.1142504"},{"key":"9147_CR22","doi-asserted-by":"crossref","unstructured":"Li, W., & McCallum, A. (2006), Pachinko allocation: DAG-structured mixture models of topic correlations. In ICML \u201906: Proceedings of the 23rd international conference on machine learning (pp. 577\u2013584). New York: ACM.","DOI":"10.1145\/1143844.1143917"},{"issue":"2","key":"9147_CR23","doi-asserted-by":"crossref","first-page":"1241","DOI":"10.14778\/1454159.1454163","volume":"1","author":"J. Madhavan","year":"2008","unstructured":"Madhavan, J., Ko, D., Kot, L., Ganapathy, V., Rasmussen, A., & Halevy, A. (2008). Google\u2019s deep web crawl. Proceedings of the VLDB Endowment 1(2), 1241\u20131252.","journal-title":"Proceedings of the VLDB Endowment"},{"key":"9147_CR24","doi-asserted-by":"crossref","DOI":"10.1017\/CBO9780511809071","volume-title":"Introduction to information retrieval","author":"C. D. Manning","year":"2008","unstructured":"Manning, C. D., Raghavan, P., & Schutze, H. (2008). Introduction to information retrieval. Cambridge: Cambridge University Press."},{"key":"9147_CR25","doi-asserted-by":"crossref","unstructured":"Paepcke, A., Brandriff, R., Janee, G., Larson, R., Ludaescher, B., Melnik, S., et al. (2000). Search middleware and the simple digital library interoperability protocol. D-Lib Magazine 6(3).","DOI":"10.1045\/march2000-paepcke"},{"key":"9147_CR26","volume-title":"The invisible web: Uncovering information sources search engines can\u2019t see","author":"G. Price","year":"2001","unstructured":"Price, G., & Sherman, C. (2001). The invisible web: Uncovering information sources search engines can\u2019t see. Medford: CyberAge Books."},{"issue":"2","key":"9147_CR27","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/1740592.1740593","volume":"28","author":"D. Puppin","year":"2010","unstructured":"Puppin, D., Silvestri, F., Perego, R., & Baeza-Yates, R. (2010). Tuning the capacity of search engines: Load-driven routing and incremental caching to reduce and balance the load. ACM Transactions on Information Systems (TOIS) 28(2), 1\u201336.","journal-title":"ACM Transactions on Information Systems (TOIS)"},{"key":"9147_CR28","doi-asserted-by":"crossref","unstructured":"Shokouhi, M. (2007). Central-rank-based collection selection in uncooperative distributed information retrieval. In Advances in information retrieval, 29th European conference on IR research. ECIR 2007, Rome, Italy, 2\u20135 April 2007, Proceedings (pp. 160\u2013172).","DOI":"10.1007\/978-3-540-71496-5_17"},{"key":"9147_CR29","doi-asserted-by":"crossref","unstructured":"Shokouhi, M., Baillie, M., & Azzopardi, L. (2007). Updating collection representations for federated search. In SIGIR \u201907: Proceedings of the 30th annual international ACM SIGIR conference on research and development in information retrieval (pp. 511\u2013518). New York: ACM.","DOI":"10.1145\/1277741.1277829"},{"key":"9147_CR30","doi-asserted-by":"crossref","unstructured":"Si, L., & Callan, J. (2003). Relevant document distribution estimation method for resource selection. In SIGIR \u201903: Proceedings of the 26th annual international ACM SIGIR conference on research and development in informaion retrieval (pp. 298\u2013305). New York: ACM.","DOI":"10.1145\/860435.860490"},{"key":"9147_CR31","doi-asserted-by":"crossref","unstructured":"Si, L., Jin, R., Callan, J., & Ogilvie, P. (2002). A language modeling framework for resource selection and results merging. In CIKM \u201902: Proceedings of the eleventh international conference on information and knowledge management (pp. 391\u2013397).  New York: ACM.","DOI":"10.1145\/584792.584856"},{"issue":"476","key":"9147_CR32","doi-asserted-by":"publisher","first-page":"1566","DOI":"10.1198\/016214506000000302","volume":"101","author":"Y. W. Teh","year":"2006","unstructured":"Teh, Y. W., Jordan,  M. I., Beal, M. J., &  Blei,  D. M.  (2006). Hierarchical dirichlet processes. Journal of the American Statistical Association 101(476), 1566\u20131581.","journal-title":"Journal of the American Statistical Association"},{"issue":"5","key":"9147_CR33","doi-asserted-by":"publisher","first-page":"581","DOI":"10.1007\/s10791-009-9094-z","volume":"12","author":"P. Thomas","year":"2009","unstructured":"Thomas, P., & Hawking, D. (2009), Server selection methods in personal metasearch: A comparative empirical study. Information Retrieval 12(5), 581\u2013604.","journal-title":"Information Retrieval"},{"key":"9147_CR34","unstructured":"Wallach, H. M, (2008). Structured topic models for language. PhD thesis, Cambridge: University of Cambridge."},{"key":"9147_CR35","doi-asserted-by":"crossref","unstructured":"Webber, W., Moffat, A., & Zobel, J. (2008). Score standardization for inter-collection comparison of retrieval systems. In SIGIR \u201908: Proceedings of the 31st annual international ACM SIGIR conference on research and development in information retrieval (pp. 51\u201358). New York: ACM.","DOI":"10.1145\/1390334.1390346"},{"key":"9147_CR36","doi-asserted-by":"crossref","unstructured":"Wei, X., & Croft, W. B. (2006). Lda-based document models for ad-hoc retrieval. In SIGIR \u201906: Proceedings of the 29th annual international ACM SIGIR conference on research and development in information retrieval (pp. 178\u2013185). New York: ACM.","DOI":"10.1145\/1148170.1148204"},{"key":"9147_CR37","doi-asserted-by":"crossref","unstructured":"Xu, J., & Croft, W. B. (1999). Cluster-based language models for distributed retrieval. In SIGIR \u201999: Proceedings of the 22nd annual international ACM SIGIR conference on research and development in information retrieval (pp. 254\u2013261). New York: ACM Press.","DOI":"10.1145\/312624.312687"}],"container-title":["Information Retrieval"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10791-010-9147-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10791-010-9147-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10791-010-9147-3","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10791-010-9147-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,2]],"date-time":"2024-01-02T14:58:42Z","timestamp":1704207522000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10791-010-9147-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2010,10,7]]},"references-count":37,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2011,8]]}},"alternative-id":["9147"],"URL":"https:\/\/doi.org\/10.1007\/s10791-010-9147-3","relation":{},"ISSN":["1386-4564","1573-7659"],"issn-type":[{"value":"1386-4564","type":"print"},{"value":"1573-7659","type":"electronic"}],"subject":[],"published":{"date-parts":[[2010,10,7]]},"assertion":[{"value":"5 February 2010","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 September 2010","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 October 2010","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}