{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,12]],"date-time":"2026-06-12T06:37:43Z","timestamp":1781246263630,"version":"3.54.1"},"reference-count":41,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2008,2,19]],"date-time":"2008-02-19T00:00:00Z","timestamp":1203379200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/2.0"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"published-print":{"date-parts":[[2008,12]]},"DOI":"10.1186\/1471-2105-9-108","type":"journal-article","created":{"date-parts":[[2008,2,19]],"date-time":"2008-02-19T14:41:56Z","timestamp":1203432116000},"source":"Crossref","is-referenced-by-count":44,"title":["MScanner: a classifier for retrieving Medline citations"],"prefix":"10.1186","volume":"9","author":[{"given":"Graham L","family":"Poulter","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Daniel L","family":"Rubin","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Russ B","family":"Altman","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Cathal","family":"Seoighe","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2008,2,19]]},"reference":[{"key":"2093_CR1","unstructured":"Fact Sheet: MEDLINE[ http:\/\/www.nlm.nih.gov\/pubs\/factsheets\/medline.html ]"},{"key":"2093_CR2","unstructured":"Fact Sheet: PubMed\u00ae: MEDLINE\u00aeR Retrieval on the World Wide Web[ http:\/\/www.nlm.nih.gov\/pubs\/factsheets\/pubmed.html ]"},{"key":"2093_CR3","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/1472-6947-7-1","volume":"7","author":"MS Siadaty","year":"2007","unstructured":"Siadaty MS, Shu J, Knaus WA: Relemed: sentence-level search engine with relevance score for the MEDLINE database of biomedical articles. BMC Med Inform Decis Mak 2007, 7: 1.","journal-title":"BMC Med Inform Decis Mak"},{"issue":"2","key":"2093_CR4","doi-asserted-by":"publisher","first-page":"e237","DOI":"10.1093\/bioinformatics\/btl302","volume":"23","author":"D Rebholz-Schuhmann","year":"2007","unstructured":"Rebholz-Schuhmann D, Kirsch H, Arregui M, Gaudan S, Riethoven M, Stoehr P: EBIMed--text crunching to gather facts for proteins from Medline. Bioinformatics 2007, 23(2):e237-e244.","journal-title":"Bioinformatics"},{"key":"2093_CR5","unstructured":"Google Scholar[ http:\/\/scholar.google.com ]"},{"key":"2093_CR6","doi-asserted-by":"publisher","first-page":"423","DOI":"10.1186\/1471-2105-8-423","volume":"8","author":"J Lin","year":"2007","unstructured":"Lin J, Wilbur WJ: PubMed related articles: a probabilistic topic-based model for content similarity. BMC Bioinformatics 2007, 8: 423.","journal-title":"BMC Bioinformatics"},{"issue":"18","key":"2093_CR7","doi-asserted-by":"publisher","first-page":"2298","DOI":"10.1093\/bioinformatics\/btl388","volume":"22","author":"J Lewis","year":"2006","unstructured":"Lewis J, Ossowski S, Hicks J, Errami M, Garner HR: Text similarity: an alternative way to search MEDLINE. Bioinformatics 2006, 22(18):2298\u20132304.","journal-title":"Bioinformatics"},{"key":"2093_CR8","doi-asserted-by":"publisher","first-page":"163","DOI":"10.1093\/nar\/30.1.163","volume":"30","author":"M Hewett","year":"2002","unstructured":"Hewett M, Oliver DE, Rubin DL, Easton KL, Stuart JM, Altman RB, Klein TE: PharmGKB: the Pharmacogenetics Knowledge Base. Nucleic Acids Res 2002, 30: 163\u2013165.","journal-title":"Nucleic Acids Res"},{"key":"2093_CR9","doi-asserted-by":"publisher","first-page":"370","DOI":"10.1186\/1471-2105-7-370","volume":"7","author":"D Chen","year":"2006","unstructured":"Chen D, M\u00fcller HM, Sternberg PW: Automatic document classification of biological literature. BMC Bioinformatics 2006, 7: 370.","journal-title":"BMC Bioinformatics"},{"issue":"11","key":"2093_CR10","doi-asserted-by":"publisher","first-page":"e309","DOI":"10.1371\/journal.pbio.0020309","volume":"2","author":"HM M\u00fcller","year":"2004","unstructured":"M\u00fcller HM, Kenny EE, Sternberg PW: Textpresso: an ontology-based information retrieval and extraction system for biological literature. PLoS Biol 2004, 2(11):e309.","journal-title":"PLoS Biol"},{"key":"2093_CR11","first-page":"7","volume-title":"Proceedings of ASAI-99, 1st Argentinian Symposium on Artificial Intelligence","author":"F Sebastiani","year":"1999","unstructured":"Sebastiani F: A Tutorial on Automated Text Categorisation. In Proceedings of ASAI-99, 1st Argentinian Symposium on Artificial Intelligence Edited by: Amandi A, Zunino R, Buenos Aires AR. 1999, 7\u201335."},{"key":"2093_CR12","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/505282.505283","volume":"34","author":"F Sebastiani","year":"2002","unstructured":"Sebastiani F: Machine learning in automated text categorization. ACM Comput Surv 2002, 34: 1\u201347.","journal-title":"ACM Comput Surv"},{"key":"2093_CR13","doi-asserted-by":"publisher","first-page":"137","DOI":"10.1007\/BFb0026683","volume-title":"ECML '98: Proceedings of the 10th European Conference on Machine Learning","author":"T Joachims","year":"1998","unstructured":"Joachims T: Text Categorization with Support Vector Machines: Learning with Many Relevant Features. In ECML '98: Proceedings of the 10th European Conference on Machine Learning. London, UK: Springer-Verlag; 1998:137\u2013142."},{"key":"2093_CR14","doi-asserted-by":"publisher","first-page":"57","DOI":"10.1093\/bib\/6.1.57","volume":"6","author":"AM Cohen","year":"2005","unstructured":"Cohen AM, Hersh WR: A survey of current work in biomedical text mining. Brief Bioinform 2005, 6: 57\u201371.","journal-title":"Brief Bioinform"},{"key":"2093_CR15","doi-asserted-by":"publisher","first-page":"269","DOI":"10.1186\/1471-2105-8-269","volume":"8","author":"P Wang","year":"2007","unstructured":"Wang P, Morgan AA, Zhang Q, Sette A, Peters B: Automating document classification for the Immune Epitope Database. BMC Bioinformatics 2007, 8: 269.","journal-title":"BMC Bioinformatics"},{"issue":"5","key":"2093_CR16","doi-asserted-by":"publisher","first-page":"404","DOI":"10.1016\/j.jbi.2005.02.008","volume":"38","author":"TA Lasko","year":"2005","unstructured":"Lasko TA, Bhagwat JG, Zou KH, Ohno-Machado L: The use of receiver operating characteristic curves in biomedical informatics. J Biomed Inform 2005, 38(5):404\u2013415.","journal-title":"J Biomed Inform"},{"key":"2093_CR17","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1186\/1471-2105-4-11","volume":"4","author":"I Donaldson","year":"2003","unstructured":"Donaldson I, Martin J, de Bruijn B, Wolting C, Lay V, Tuekam B, Zhang S, Baskin B, Bader GD, Michalickova K, Pawson T, Hogue CWV: PreBIND and Textomy-mining the biomedical literature for protein-protein interactions using a support vector machine. BMC Bioinformatics 2003, 4: 11.","journal-title":"BMC Bioinformatics"},{"issue":"2","key":"2093_CR18","doi-asserted-by":"publisher","first-page":"207","DOI":"10.1197\/jamia.M1641","volume":"12","author":"Y Aphinyanaphongs","year":"2005","unstructured":"Aphinyanaphongs Y, Tsamardinos I, Statnikov A, Hardin D, Aliferis CF: Text categorization models for high-quality article retrieval in internal medicine. J Am Med Inform Assoc 2005, 12(2):207\u2013216.","journal-title":"J Am Med Inform Assoc"},{"issue":"4","key":"2093_CR19","doi-asserted-by":"publisher","first-page":"359","DOI":"10.1093\/bioinformatics\/17.4.359","volume":"17","author":"EM Marcotte","year":"2001","unstructured":"Marcotte EM, Xenarios I, Eisenberg D: Mining literature for protein-protein interactions. Bioinformatics 2001, 17(4):359\u2013363.","journal-title":"Bioinformatics"},{"key":"2093_CR20","volume-title":"The Fourteenth Text REtrieval Conference (TREC 2005)","author":"W Hersh","year":"2005","unstructured":"Hersh W, Cohen A, Yang J, Bhupatiraju R, Roberts P, Hearst M: TREC 2005 Genomics Track Overview. The Fourteenth Text REtrieval Conference (TREC 2005) 2005."},{"key":"2093_CR21","first-page":"161","volume-title":"AMIA Annu Symp Proc","author":"AM Cohen","year":"2006","unstructured":"Cohen AM: An effective general purpose approach for automated biomedical document classification. AMIA Annu Symp Proc 2006, 161\u2013165."},{"key":"2093_CR22","doi-asserted-by":"publisher","first-page":"75","DOI":"10.1186\/1471-2105-6-75","volume":"6","author":"BP Suomela","year":"2005","unstructured":"Suomela BP, Andrade MA: Ranking the whole MEDLINE database according to a large training set using text indexing. BMC Bioinformatics 2005, 6: 75.","journal-title":"BMC Bioinformatics"},{"issue":"2","key":"2093_CR23","doi-asserted-by":"publisher","first-page":"121","DOI":"10.1197\/jamia.M1640","volume":"12","author":"DL Rubin","year":"2005","unstructured":"Rubin DL, Thorn CF, Klein TE, Altman RB: A statistical approach to scanning the biomedical literature for pharmacogenetics knowledge. J Am Med Inform Assoc 2005, 12(2):121\u2013129.","journal-title":"J Am Med Inform Assoc"},{"key":"2093_CR24","doi-asserted-by":"crossref","unstructured":"Goetz T, von der Lieth CW: PubFinder: a tool for improving retrieval rate of relevant PubMed abstracts. Nucleic Acids Res 2005, (33 Web Server):W774-W778.","DOI":"10.1093\/nar\/gki429"},{"issue":"14","key":"2093_CR25","doi-asserted-by":"publisher","first-page":"e220","DOI":"10.1093\/bioinformatics\/btl203","volume":"22","author":"H Jang","year":"2006","unstructured":"Jang H, Lim J, Lim JH, Park SJ, Lee KC, Park SH: Finding the evidence for protein-protein interactions from PubMed abstracts. Bioinformatics 2006, 22(14):e220-e226.","journal-title":"Bioinformatics"},{"key":"2093_CR26","first-page":"750","volume-title":"Proc AMIA Symp","author":"X Liu","year":"1998","unstructured":"Liu X, Altman RB: Updating a bibliography using the related articles function within PubMed. Proc AMIA Symp 1998, 750\u2013754."},{"issue":"3","key":"2093_CR27","first-page":"189","volume":"2","author":"C Perez-Iratxeta","year":"2003","unstructured":"Perez-Iratxeta C, Astola N, Ciccarelli FD, Sha PK, Bork P, Andrade MA: A protocol for the update of references to scientific literature in biological databases. Appl Bioinformatics 2003, 2(3):189\u2013191.","journal-title":"Appl Bioinformatics"},{"issue":"3","key":"2093_CR28","doi-asserted-by":"publisher","first-page":"243","DOI":"10.1093\/comjnl\/35.3.243","volume":"35","author":"N Fuhr","year":"1992","unstructured":"Fuhr N: Probabilistic models in information retrieval. Comput J 1992, 35(3):243\u2013255.","journal-title":"Comput J"},{"issue":"6","key":"2093_CR29","doi-asserted-by":"publisher","first-page":"488","DOI":"10.1016\/j.ijmedinf.2005.06.007","volume":"75","author":"I Tbahriti","year":"2005","unstructured":"Tbahriti I, Chichester C, Lisacek F, Ruch P: Using argumentation to retrieve articles with similar citations: an inquiry into improving related articles search in the MEDLINE digital library. Int J Med Inform 2005, 75(6):488\u2013495.","journal-title":"Int J Med Inform"},{"key":"2093_CR30","doi-asserted-by":"publisher","first-page":"2","DOI":"10.1186\/1747-5333-1-2","volume":"1","author":"W Zhou","year":"2006","unstructured":"Zhou W, Smalheiser NR, Yu C: A tutorial on information retrieval: basic terms and concepts. J Biomed Discov Collab 2006, 1: 2.","journal-title":"J Biomed Discov Collab"},{"key":"2093_CR31","doi-asserted-by":"publisher","first-page":"29","DOI":"10.1148\/radiology.143.1.7063747","volume":"143","author":"JA Hanley","year":"1982","unstructured":"Hanley JA, McNeil BJ: The meaning and use of the area under a receiver operating characteristic (ROC) curve. Radiology 1982, 143: 29\u201336.","journal-title":"Radiology"},{"issue":"9","key":"2093_CR32","doi-asserted-by":"publisher","first-page":"577","DOI":"10.1097\/00008571-200409000-00002","volume":"14","author":"JT Chang","year":"2004","unstructured":"Chang JT, Altman RB: Extracting and characterizing gene-drug relationships from the literature. Pharmacogenetics 2004, 14(9):577\u2013586.","journal-title":"Pharmacogenetics"},{"key":"2093_CR33","first-page":"233","volume-title":"ICML 2006: Proceedings of the 23rd International Conference on Machine learning","author":"J Davis","year":"2006","unstructured":"Davis J, Goadrich M: The relationship between Precision-Recall and ROC curves. In ICML 2006: Proceedings of the 23rd International Conference on Machine learning. New York, NY, USA: ACM Press; 2006:233\u2013240."},{"key":"2093_CR34","doi-asserted-by":"publisher","first-page":"115","DOI":"10.1177\/154407370301700126","volume":"17","author":"WC Bartling","year":"2003","unstructured":"Bartling WC, Schleyer TK, Visweswaran S: Retrieval and classification of dental research articles. Adv Dent Res 2003, 17: 115\u2013120.","journal-title":"Adv Dent Res"},{"key":"2093_CR35","volume-title":"Tech. rep., Just Research","author":"A McCallum","year":"1998","unstructured":"McCallum A, Nigam K: A comparison of event models for Naive Bayes text classification. Tech. rep., Just Research 1998."},{"key":"2093_CR36","doi-asserted-by":"publisher","first-page":"33","DOI":"10.3115\/1118935.1118940","volume-title":"IRAL 2003: Proceedings of the Sixth International Workshop on Information Retrieval with Asian Languages","author":"SB Kim","year":"2003","unstructured":"Kim SB, Seo HC, Rim HC: Poisson naive Bayes for text classification with feature weighting. In IRAL 2003: Proceedings of the Sixth International Workshop on Information Retrieval with Asian Languages. Morristown, NJ, USA: Association for Computational Linguistics; 2003:33\u201340."},{"key":"2093_CR37","doi-asserted-by":"publisher","DOI":"10.1007\/b137845","volume-title":"Statistical Methods in Bioinformatics: An Introduction","author":"WJ Ewens","year":"2005","unstructured":"Ewens WJ, Grant GR: Statistical Methods in Bioinformatics: An Introduction. 2nd edition. Springer; 2005.","edition":"2"},{"key":"2093_CR38","volume-title":"Python Reference Manual. Virginia, USA","author":"G van Rossum","year":"2001","unstructured":"van Rossum G, Drake FL:Python Reference Manual. Virginia, USA. 2001. [ http:\/\/www.python.org ]"},{"key":"2093_CR39","unstructured":"2007 MEDLINE\u00aeR\/PubMed\u00aeR Baseline Distribution[ http:\/\/www.nlm.nih.gov\/bsd\/licensee\/2007_stats\/baseline_doc.html ]"},{"key":"2093_CR40","unstructured":"National Library of Medicine AIDS Subset Strategy[ http:\/\/www.nlm.nih.gov\/bsd\/pubmed_subsets\/aids_strategy.html ]"},{"key":"2093_CR41","unstructured":"National Library of Medicine Bioethics Subset Strategy[ http:\/\/www.nlm.nih.gov\/bsd\/pubmed_subsets\/bioethics_strategy.html ]"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1471-2105-9-108.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/1471-2105-9-108\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1471-2105-9-108.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,8]],"date-time":"2019-05-08T00:19:18Z","timestamp":1557274758000},"score":1,"resource":{"primary":{"URL":"https:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/1471-2105-9-108"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2008,2,19]]},"references-count":41,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2008,12]]}},"alternative-id":["2093"],"URL":"https:\/\/doi.org\/10.1186\/1471-2105-9-108","relation":{},"ISSN":["1471-2105"],"issn-type":[{"value":"1471-2105","type":"electronic"}],"subject":[],"published":{"date-parts":[[2008,2,19]]},"article-number":"108"}}