{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,22]],"date-time":"2026-03-22T15:58:21Z","timestamp":1774195101930,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":59,"publisher":"ACM","license":[{"start":{"date-parts":[[2015,8,10]],"date-time":"2015-08-10T00:00:00Z","timestamp":1439164800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"DARPA","award":["N66001-14-1-4027"],"award-info":[{"award-number":["N66001-14-1-4027"]}]},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["NIH-GM079656, NIH-GM066099"],"award-info":[{"award-number":["NIH-GM079656, NIH-GM066099"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["NSF DBI-1356569, NSF DBI-0851393"],"award-info":[{"award-number":["NSF DBI-1356569, NSF DBI-0851393"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2015,8,10]]},"DOI":"10.1145\/2783258.2788609","type":"proceedings-article","created":{"date-parts":[[2015,8,7]],"date-time":"2015-08-07T15:38:27Z","timestamp":1438961907000},"page":"2019-2028","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":23,"title":["Predicting Future Scientific Discoveries Based on a Networked Analysis of the Past Literature"],"prefix":"10.1145","author":[{"given":"Meenakshi","family":"Nagarajan","sequence":"first","affiliation":[{"name":"IBM Almaden Research, San Jose, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Angela D.","family":"Wilkins","sequence":"additional","affiliation":[{"name":"Baylor College of Medicine, Houston, TX, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Benjamin J.","family":"Bachman","sequence":"additional","affiliation":[{"name":"Baylor College of Medicine, Houston, TX, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ilya B.","family":"Novikov","sequence":"additional","affiliation":[{"name":"Baylor College of Medicine, Houston, TX, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shenghua","family":"Bao","sequence":"additional","affiliation":[{"name":"IBM Almaden Research, San Jose, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Peter J.","family":"Haas","sequence":"additional","affiliation":[{"name":"IBM Almaden Research, San Jose, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mar\u00eda E.","family":"Terr\u00f3n-D\u00edaz","sequence":"additional","affiliation":[{"name":"Baylor College of Medicine, Houston, TX, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sumit","family":"Bhatia","sequence":"additional","affiliation":[{"name":"IBM Research Almaden, San Jose, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Anbu K.","family":"Adikesavan","sequence":"additional","affiliation":[{"name":"Baylor College of Medicine, Houston, TX, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jacques J.","family":"Labrie","sequence":"additional","affiliation":[{"name":"IBM Research Almaden, San Jose, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sam","family":"Regenbogen","sequence":"additional","affiliation":[{"name":"Baylor College of Medicine, Houston, TX, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Christie M.","family":"Buchovecky","sequence":"additional","affiliation":[{"name":"Baylor College of Medicine, Houston, TX, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Curtis R.","family":"Pickering","sequence":"additional","affiliation":[{"name":"The University of Texas MD Anderson Cancer Center, Houston, TX, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Linda","family":"Kato","sequence":"additional","affiliation":[{"name":"IBM Research Almaden, San Jose, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Andreas M.","family":"Lisewski","sequence":"additional","affiliation":[{"name":"Baylor College of Medicine, Houston, TX, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ana","family":"Lelescu","sequence":"additional","affiliation":[{"name":"IBM Research Almaden, San Jose, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Houyin","family":"Zhang","sequence":"additional","affiliation":[{"name":"Baylor College of Medicine, Houston, TX, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Stephen","family":"Boyer","sequence":"additional","affiliation":[{"name":"IBM Research Almaden, San Jose, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Griff","family":"Weber","sequence":"additional","affiliation":[{"name":"IBM Research Almaden, San Jose, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ying","family":"Chen","sequence":"additional","affiliation":[{"name":"IBM Research Almaden, San Jose, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lawrence","family":"Donehower","sequence":"additional","affiliation":[{"name":"Baylor College of Medicine, Houston, TX, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Scott","family":"Spangler","sequence":"additional","affiliation":[{"name":"IBM Research Almaden, San Jose, CA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Olivier","family":"Lichtarge","sequence":"additional","affiliation":[{"name":"Baylor College of Medicine, Houston, TX, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2015,8,10]]},"reference":[{"key":"e_1_3_2_2_1_1","doi-asserted-by":"publisher","DOI":"10.1136\/jamia.2009.002733"},{"key":"e_1_3_2_2_2_1","doi-asserted-by":"publisher","DOI":"10.1038\/75556"},{"key":"e_1_3_2_2_3_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.csda.2006.11.006"},{"key":"e_1_3_2_2_4_1","doi-asserted-by":"publisher","DOI":"10.1186\/1471-2105-7-488"},{"key":"e_1_3_2_2_5_1","first-page":"7407","article-title":"Comprehensive molecular characterization of human colon and rectal cancer","volume":"487","author":"Cancer Genome Atlas N.","year":"2012","unstructured":"Cancer Genome Atlas , N. , 2012 . Comprehensive molecular characterization of human colon and rectal cancer . Nature 487 , 7407 (Jul 19), 330--337. Cancer Genome Atlas, N., 2012. Comprehensive molecular characterization of human colon and rectal cancer. Nature 487, 7407 (Jul 19), 330--337.","journal-title":"Nature"},{"key":"e_1_3_2_2_6_1","first-page":"7216","article-title":"Comprehensive genomic characterization defines human glioblastoma genes and core pathways","volume":"455","author":"Cancer Genome Atlas Research N.","year":"2008","unstructured":"Cancer Genome Atlas Research , N. , 2008 . Comprehensive genomic characterization defines human glioblastoma genes and core pathways . Nature 455 , 7216 (Oct 23), 1061--1068. Cancer Genome Atlas Research, N., 2008. Comprehensive genomic characterization defines human glioblastoma genes and core pathways. Nature 455, 7216 (Oct 23), 1061--1068.","journal-title":"Nature"},{"key":"e_1_3_2_2_7_1","doi-asserted-by":"crossref","unstructured":"Catral M. etal 2004. On reduced rank nonnegative matrix factorization for symmetric nonnegative matrices. Linear Algebra and its Applications 393 107--126.  Catral M. et al. 2004. On reduced rank nonnegative matrix factorization for symmetric nonnegative matrices. Linear Algebra and its Applications 393 107--126.","DOI":"10.1016\/j.laa.2003.11.024"},{"key":"e_1_3_2_2_8_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.compbiomed.2005.09.005"},{"key":"e_1_3_2_2_9_1","doi-asserted-by":"publisher","DOI":"10.1093\/bib\/6.1.57"},{"key":"e_1_3_2_2_10_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2013.12.010"},{"key":"e_1_3_2_2_11_1","volume-title":"The Comparative Toxicogenomics Database: update","author":"Davis A.P.","year":"2011","unstructured":"Davis , A.P. , The Comparative Toxicogenomics Database: update 2011 . Nucleic Acids Res 39, Database issue (Jan), D1067--1072. Davis, A.P., et al., 2011. The Comparative Toxicogenomics Database: update 2011. Nucleic Acids Res 39, Database issue (Jan), D1067--1072."},{"key":"e_1_3_2_2_12_1","doi-asserted-by":"publisher","DOI":"10.1016\/S0168-9525(02)02763-4"},{"key":"e_1_3_2_2_13_1","doi-asserted-by":"publisher","DOI":"10.1093\/nar\/gks1094"},{"key":"e_1_3_2_2_14_1","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btl616"},{"key":"e_1_3_2_2_15_1","volume-title":"The Gene Ontology project","author":"Gene Ontology C.","year":"2008","unstructured":"Gene Ontology , C. , 2008. The Gene Ontology project in 2008 . Nucleic Acids Res 36, Database issue (Jan), D440--444. Gene Ontology, C., 2008. The Gene Ontology project in 2008. Nucleic Acids Res 36, Database issue (Jan), D440--444."},{"key":"e_1_3_2_2_16_1","doi-asserted-by":"crossref","unstructured":"Gene Ontology C. 2010. The Gene Ontology in 2010: extensions and refinements. Nucleic Acids Res 38 Database issue (Jan) D331--335.  Gene Ontology C. 2010. The Gene Ontology in 2010: extensions and refinements. Nucleic Acids Res 38 Database issue (Jan) D331--335.","DOI":"10.1093\/nar\/gkp1018"},{"key":"e_1_3_2_2_17_1","doi-asserted-by":"publisher","DOI":"10.1093\/nar\/gks1066"},{"key":"e_1_3_2_2_18_1","volume-title":"I-942-I-947","author":"Guillamet D.","unstructured":"Guillamet , D. , A weighted non-negative matrix factorization for local representations IEEE , I-942-I-947 vol. 941 . Guillamet, D., et al., 2001. A weighted non-negative matrix factorization for local representations IEEE, I-942-I-947 vol. 941."},{"key":"e_1_3_2_2_19_1","doi-asserted-by":"publisher","DOI":"10.1109\/TSP.2006.879282"},{"key":"e_1_3_2_2_20_1","doi-asserted-by":"crossref","unstructured":"Hatzivassiloglou V. etal 2001. Disambiguating proteins genes and RNA in text: a machine learning approach. Bioinformatics 17 Suppl 1 suppl 1 S97--106.  Hatzivassiloglou V. et al. 2001. Disambiguating proteins genes and RNA in text: a machine learning approach. Bioinformatics 17 Suppl 1 suppl 1 S97--106.","DOI":"10.1093\/bioinformatics\/17.suppl_1.S97"},{"key":"e_1_3_2_2_21_1","doi-asserted-by":"publisher","DOI":"10.1109\/TCBB.2007.70243"},{"key":"e_1_3_2_2_22_1","doi-asserted-by":"publisher","DOI":"10.1038\/ng0704-664"},{"key":"e_1_3_2_2_23_1","doi-asserted-by":"crossref","unstructured":"Hornbeck P.V. etal 2015. PhosphoSitePlus 2014: mutations PTMs and recalibrations. Nucleic Acids Res 43 Database issue (Jan) D512--520.  Hornbeck P.V. et al. 2015. PhosphoSitePlus 2014: mutations PTMs and recalibrations. Nucleic Acids Res 43 Database issue (Jan) D512--520.","DOI":"10.1093\/nar\/gku1267"},{"key":"e_1_3_2_2_24_1","first-page":"7011","article-title":"Finishing the euchromatic sequence of the human genome","volume":"431","author":"International Human Genome Sequencing C.","year":"2004","unstructured":"International Human Genome Sequencing , C. , 2004 . Finishing the euchromatic sequence of the human genome . Nature 431 , 7011 (Oct 21), 931--945. International Human Genome Sequencing, C., 2004. Finishing the euchromatic sequence of the human genome. Nature 431, 7011 (Oct 21), 931--945.","journal-title":"Nature"},{"key":"e_1_3_2_2_25_1","doi-asserted-by":"publisher","DOI":"10.1038\/ng0501-21"},{"key":"e_1_3_2_2_26_1","volume-title":"Proc. Asian Conf. on Comp. Vision, 27--30","author":"Jia Y.W.Y.","unstructured":"Jia , Y.W.Y. and Turk , C.H.M. ,2004 Fisher non-negative matrix factorization for learning local features . In Proc. Asian Conf. on Comp. Vision, 27--30 . Jia, Y.W.Y. and Turk, C.H.M. ,2004 Fisher non-negative matrix factorization for learning local features. In Proc. Asian Conf. on Comp. Vision, 27--30."},{"key":"e_1_3_2_2_27_1","doi-asserted-by":"publisher","DOI":"10.1111\/j.1538-7836.2012.04930.x"},{"key":"e_1_3_2_2_28_1","unstructured":"Kim J.D. etal 2011. Overview of BioNLP shared task 2011 Association for Computational Linguistics 1--6.   Kim J.D. et al. 2011. Overview of BioNLP shared task 2011 Association for Computational Linguistics 1--6."},{"key":"e_1_3_2_2_29_1","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pcbi.1000454"},{"key":"e_1_3_2_2_30_1","volume-title":"Proceedings of the 48th Annual Meeting of the Association for Computational Linguistics","author":"Laura C.","year":"2010","unstructured":"Laura , C. , , 2010 . SystemT: an algebraic approach to declarative information extraction . In Proceedings of the 48th Annual Meeting of the Association for Computational Linguistics , Uppsala, Sweden, 128--137. Laura, C., et al., 2010. SystemT: an algebraic approach to declarative information extraction. In Proceedings of the 48th Annual Meeting of the Association for Computational Linguistics, Uppsala, Sweden, 128--137."},{"key":"e_1_3_2_2_31_1","doi-asserted-by":"publisher","DOI":"10.1038\/44565"},{"key":"e_1_3_2_2_32_1","unstructured":"Lee D.D. and Seung H.S. 2000. Algorithms for Non-negative Matrix Factorization. In NIPS 556--562.  Lee D.D. and Seung H.S. 2000. Algorithms for Non-negative Matrix Factorization. In NIPS 556--562."},{"key":"e_1_3_2_2_33_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.physa.2010.04.005"},{"key":"e_1_3_2_2_34_1","volume-title":"Introduction to Information Retrieval","author":"Manning C.D.","unstructured":"Manning , C.D. , Introduction to Information Retrieval . Cambridge University Press Cambridge . Manning, C.D., et al., 2008. Introduction to Information Retrieval. Cambridge University Press Cambridge."},{"key":"e_1_3_2_2_35_1","unstructured":"Manning C.D. and Sch\u00fctze H. 1999. Foundations of statistical natural language processing. MIT press.   Manning C.D. and Sch\u00fctze H. 1999. Foundations of statistical natural language processing. MIT press."},{"key":"e_1_3_2_2_36_1","unstructured":"Mccord M.C. and Bernth A. 2010. Using slot grammar. IBM TJ Watson Res. Center Yorktown Heights NY IBM Res. Rep. RC23978.  Mccord M.C. and Bernth A. 2010. Using slot grammar. IBM TJ Watson Res. Center Yorktown Heights NY IBM Res. Rep. RC23978."},{"key":"e_1_3_2_2_37_1","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btn631"},{"key":"e_1_3_2_2_38_1","volume-title":"Proceedings of the BioNLP Shared Task 2013 Workshop, 1--7.","author":"N\u00e9dellec C.","year":"2013","unstructured":"N\u00e9dellec , C. , , 2013 . Overview of BioNLP shared task 2013 . Proceedings of the BioNLP Shared Task 2013 Workshop, 1--7. N\u00e9dellec, C., et al., 2013. Overview of BioNLP shared task 2013. Proceedings of the BioNLP Shared Task 2013 Workshop, 1--7."},{"key":"e_1_3_2_2_39_1","doi-asserted-by":"publisher","DOI":"10.1002\/env.3170050203"},{"key":"e_1_3_2_2_40_1","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btu383"},{"key":"e_1_3_2_2_41_1","doi-asserted-by":"publisher","DOI":"10.1186\/1471-2105-8-50"},{"key":"e_1_3_2_2_42_1","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0102039"},{"key":"e_1_3_2_2_43_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.jbi.2003.10.001"},{"key":"e_1_3_2_2_44_1","unstructured":"Salton G. and Mcgill M.J. 1986. Introduction to Modern Information Retrieval. McGraw-Hill Inc.   Salton G. and Mcgill M.J. 1986. Introduction to Modern Information Retrieval. McGraw-Hill Inc."},{"key":"e_1_3_2_2_45_1","doi-asserted-by":"publisher","DOI":"10.1145\/2623330.2623667"},{"key":"e_1_3_2_2_46_1","doi-asserted-by":"publisher","DOI":"10.1145\/2623330.2623667"},{"key":"e_1_3_2_2_47_1","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.0708078105"},{"key":"e_1_3_2_2_48_1","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/18.8.1124"},{"key":"e_1_3_2_2_49_1","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pcbi.1000837"},{"key":"e_1_3_2_2_50_1","doi-asserted-by":"publisher","DOI":"10.1038\/nprot.2011.367"},{"key":"e_1_3_2_2_51_1","volume-title":"Update on activities at the Universal Protein Resource (UniProt)","author":"Uniprot C.","year":"2013","unstructured":"Uniprot , C. , 2013. Update on activities at the Universal Protein Resource (UniProt) in 2013 . Nucleic Acids Res 41, Database issue (Jan), D43--47. Uniprot, C., 2013. Update on activities at the Universal Protein Resource (UniProt) in 2013. Nucleic Acids Res 41, Database issue (Jan), D43--47."},{"key":"e_1_3_2_2_52_1","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0055814"},{"key":"e_1_3_2_2_53_1","doi-asserted-by":"publisher","DOI":"10.1089\/cmb.2012.0273"},{"key":"e_1_3_2_2_54_1","doi-asserted-by":"publisher","DOI":"10.1093\/nar\/gkg033"},{"key":"e_1_3_2_2_55_1","doi-asserted-by":"crossref","unstructured":"Wishart D.S. etal 2009. HMDB: a knowledgebase for the human metabolome. Nucleic Acids Res 37 Database issue (Jan) D603--610.  Wishart D.S. et al. 2009. HMDB: a knowledgebase for the human metabolome. Nucleic Acids Res 37 Database issue (Jan) D603--610.","DOI":"10.1093\/nar\/gkn810"},{"key":"e_1_3_2_2_56_1","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btp631"},{"key":"e_1_3_2_2_57_1","doi-asserted-by":"crossref","unstructured":"You Z.H. etal 2013. Prediction of protein-protein interactions from amino acid sequences with ensemble extreme learning machines and principal component analysis. BMC bioinformatics 14 Suppl 8 S10.  You Z.H. et al. 2013. Prediction of protein-protein interactions from amino acid sequences with ensemble extreme learning machines and principal component analysis. BMC bioinformatics 14 Suppl 8 S10.","DOI":"10.1186\/1471-2105-14-S8-S10"},{"key":"e_1_3_2_2_58_1","doi-asserted-by":"publisher","DOI":"10.1038\/nature11503"},{"key":"e_1_3_2_2_59_1","doi-asserted-by":"publisher","DOI":"10.1038\/srep03202"}],"event":{"name":"KDD '15: The 21th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining","location":"Sydney NSW Australia","acronym":"KDD '15","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data"]},"container-title":["Proceedings of the 21th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2783258.2788609","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/2783258.2788609","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T05:07:14Z","timestamp":1750223234000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2783258.2788609"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,8,10]]},"references-count":59,"alternative-id":["10.1145\/2783258.2788609","10.1145\/2783258"],"URL":"https:\/\/doi.org\/10.1145\/2783258.2788609","relation":{},"subject":[],"published":{"date-parts":[[2015,8,10]]},"assertion":[{"value":"2015-08-10","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}