{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T04:59:29Z","timestamp":1750309169436,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":33,"publisher":"ACM","license":[{"start":{"date-parts":[[2008,10,26]],"date-time":"2008-10-26T00:00:00Z","timestamp":1224979200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2008,10,26]]},"DOI":"10.1145\/1458082.1458186","type":"proceedings-article","created":{"date-parts":[[2008,11,11]],"date-time":"2008-11-11T12:59:40Z","timestamp":1226408380000},"page":"779-786","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":7,"title":["Identification of gene function using prediction by partial matching (PPM) language models"],"prefix":"10.1145","author":[{"given":"Malika","family":"Mahoui","sequence":"first","affiliation":[{"name":"IUPUI, Indianapolis, IN, USA"}]},{"given":"William John","family":"Teahan","sequence":"additional","affiliation":[{"name":"University of Wales, Bangor, Wales, United Kngdm"}]},{"given":"Arvind Kumar","family":"Thirumalaiswamy Sekhar","sequence":"additional","affiliation":[{"name":"Dow AgroSciences, Indianapolis, IN, USA"}]},{"given":"Satyasaibabu","family":"Chilukuri","sequence":"additional","affiliation":[{"name":"IUPUI, Indianapolis, IN, USA"}]}],"member":"320","published-online":{"date-parts":[[2008,10,26]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"PubMed; http:\/\/www.ncbi.nlm.nih.gov\/entrez\/ (2008).  PubMed; http:\/\/www.ncbi.nlm.nih.gov\/entrez\/ (2008)."},{"key":"e_1_3_2_1_2_1","first-page":"339","volume-title":"APBC","author":"Fukuda K.","year":"2004"},{"volume-title":"EMBO Workshop: A critical assessment of text mining methods in molecular biology","year":"2004","author":"Bickel S.","key":"e_1_3_2_1_3_1"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"crossref","unstructured":"Ono T Hishigaki H Tanigami A Takagi T. (2001) \"Automated extraction of information on protein-protein interactions from the biological literature\". Bioinformatics Feb;17(2):155--61.  Ono T Hishigaki H Tanigami A Takagi T. (2001) \"Automated extraction of information on protein-protein interactions from the biological literature\". Bioinformatics Feb;17(2):155--61.","DOI":"10.1093\/bioinformatics\/17.2.155"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/bth904"},{"volume-title":"Pacific Symposium on Biocomputing.,403--414","year":"2003","author":"Hanisch D.","key":"e_1_3_2_1_6_1"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.3115\/1118958.1118967"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btg393"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/bti084"},{"key":"e_1_3_2_1_10_1","volume-title":"Bioinformatics","volume":"19","author":"Chiang J.H.","year":"2003"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"crossref","unstructured":"Raychaudhuri S. Chang J.T. Sutphin P.D. Altman R.B. (2002) \"Associating genes with gene ontology codes using a maximum entropy analysis of biomedical literature\". Genome Research. Jan;12(1):203--14.  Raychaudhuri S. Chang J.T. Sutphin P.D. Altman R.B. (2002) \"Associating genes with gene ontology codes using a maximum entropy analysis of biomedical literature\". Genome Research. Jan;12(1):203--14.","DOI":"10.1101\/gr.199701"},{"key":"e_1_3_2_1_12_1","unstructured":"Seki K. Mostafa J. (2003) \"Towards database curation in biology automated gene function identification from text\" Tech. report Indiana University http:\/\/lair.slis.indiana.edu\/research\/capris\/papers.html.  Seki K. Mostafa J. (2003) \"Towards database curation in biology automated gene function identification from text\" Tech. report Indiana University http:\/\/lair.slis.indiana.edu\/research\/capris\/papers.html."},{"key":"e_1_3_2_1_13_1","unstructured":"Gene ontology. (2007) http:\/\/www.geneontology.org\/ .  Gene ontology. (2007) http:\/\/www.geneontology.org\/ ."},{"key":"e_1_3_2_1_14_1","unstructured":"NCBI. (2008) http:\/\/www.ncbi.nlm.nih.gov\/.  NCBI. (2008) http:\/\/www.ncbi.nlm.nih.gov\/."},{"key":"e_1_3_2_1_15_1","unstructured":"GeneRIF.(2007) http:\/\/www.ncbi.nlm.nih.gov\/projects\/GeneRIF\/GeneRIFhelp.html.  GeneRIF.(2007) http:\/\/www.ncbi.nlm.nih.gov\/projects\/GeneRIF\/GeneRIFhelp.html."},{"key":"e_1_3_2_1_16_1","unstructured":"Teahan W.J. (2006) The Text Mining Toolkit. http:\/\/www.cs.bangor.ac.uk\/~wjt.  Teahan W.J. (2006) The Text Mining Toolkit. http:\/\/www.cs.bangor.ac.uk\/~wjt."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/TCOM.1984.1096090"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/26.61469"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"crossref","unstructured":"Teahan W. J. &amp; Harper D. J. (2003) \"Using compression-based language models for text categorization\". Language Modeling for Information Retrieval edited by W. B. Croft &amp; J. Lafferty Kluwer. page(s) 141--166.  Teahan W. J. &amp; Harper D. J. (2003) \"Using compression-based language models for text categorization\". Language Modeling for Information Retrieval edited by W. B. Croft &amp; J. Lafferty Kluwer. page(s) 141--166.","DOI":"10.1007\/978-94-017-0171-6_7"},{"key":"e_1_3_2_1_20_1","unstructured":"Teahan W.J. (1998) \"Modelling English Text\" Ph.D. thesis Dept. of Computer Science The University of Waikato.  Teahan W.J. (1998) \"Modelling English Text\" Ph.D. thesis Dept. of Computer Science The University of Waikato."},{"key":"e_1_3_2_1_21_1","unstructured":"Bell T. Cleary J. and Witten I. (1990) Text Compression. Prentice Hall.   Bell T. Cleary J. and Witten I. (1990) Text Compression. Prentice Hall."},{"key":"e_1_3_2_1_22_1","unstructured":"Howard P.G. (1993) The Design and Analysis of Efficient Lossless Data Compression Systems. Ph.D. Thesis Brown University.   Howard P.G. (1993) The Design and Analysis of Efficient Lossless Data Compression Systems. Ph.D. Thesis Brown University."},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.5555\/789086.789617"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/319382.319394"},{"key":"e_1_3_2_1_25_1","unstructured":"Jelinek F. (1985) \"Self-organized Language Modeling for Speech Recognition \" IBM Report.  Jelinek F. (1985) \"Self-organized Language Modeling for Speech Recognition \" IBM Report."},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1002\/j.1538-7305.1948.tb01338.x"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.1967.1054010"},{"volume-title":"PRICAI'2000 Workshop on Text and Data Mining, pages. 52--63","year":"2000","author":"Yeates S.","key":"e_1_3_2_1_28_1"},{"key":"e_1_3_2_1_29_1","first-page":"582","volume-title":"Proc Data Compression Conference","author":"Yeates S.","year":"2000"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.5555\/882454.875121"},{"key":"e_1_3_2_1_31_1","first-page":"943","volume-title":"Proceedings of the International Conference on Content-based Multimedia Information Access (RIAO","author":"Teahan W.","year":"2000"},{"key":"e_1_3_2_1_32_1","unstructured":"GeneRIF help. (2007) http:\/\/www.ncbi.nlm.nih.gov\/projects\/GeneRIF\/GeneRIFhelp.html.  GeneRIF help. (2007) http:\/\/www.ncbi.nlm.nih.gov\/projects\/GeneRIF\/GeneRIFhelp.html."},{"volume-title":"IEEE Data Compression Conference","author":"Cleary J.G.","key":"e_1_3_2_1_33_1"}],"event":{"name":"CIKM08: Conference on Information and Knowledge Management","sponsor":["SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web","ACM Association for Computing Machinery","SIGIR ACM Special Interest Group on Information Retrieval"],"location":"Napa Valley California USA","acronym":"CIKM08"},"container-title":["Proceedings of the 17th ACM conference on Information and knowledge management"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1458082.1458186","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/1458082.1458186","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T22:53:44Z","timestamp":1750287224000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1458082.1458186"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2008,10,26]]},"references-count":33,"alternative-id":["10.1145\/1458082.1458186","10.1145\/1458082"],"URL":"https:\/\/doi.org\/10.1145\/1458082.1458186","relation":{},"subject":[],"published":{"date-parts":[[2008,10,26]]},"assertion":[{"value":"2008-10-26","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}