{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,22]],"date-time":"2026-01-22T12:19:09Z","timestamp":1769084349803,"version":"3.49.0"},"reference-count":35,"publisher":"American Chemical Society (ACS)","issue":"9","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["J. Chem. Inf. Model."],"published-print":{"date-parts":[[2011,9,26]]},"DOI":"10.1021\/ci2001988","type":"journal-article","created":{"date-parts":[[2011,7,31]],"date-time":"2011-07-31T14:37:10Z","timestamp":1312123030000},"page":"2186-2208","source":"Crossref","is-referenced-by-count":15,"title":["Self-Contained Sequence Representation: Bridging the Gap between Bioinformatics and Cheminformatics"],"prefix":"10.1021","volume":"51","author":[{"given":"William L.","family":"Chen","sequence":"first","affiliation":[{"name":"Accelrys, Incorporated, 2440 Camino Ramon, Suite 300, San Ramon, California 94583, United States"}]},{"given":"Burton A.","family":"Leland","sequence":"additional","affiliation":[{"name":"Accelrys, Incorporated, 2440 Camino Ramon, Suite 300, San Ramon, California 94583, United States"}]},{"given":"Joseph L.","family":"Durant","sequence":"additional","affiliation":[{"name":"Accelrys, Incorporated, 2440 Camino Ramon, Suite 300, San Ramon, California 94583, United States"}]},{"given":"David L.","family":"Grier","sequence":"additional","affiliation":[{"name":"Accelrys, Incorporated, 2440 Camino Ramon, Suite 300, San Ramon, California 94583, United States"}]},{"given":"Bradley D.","family":"Christie","sequence":"additional","affiliation":[{"name":"Accelrys, Incorporated, 2440 Camino Ramon, Suite 300, San Ramon, California 94583, United States"}]},{"given":"James G.","family":"Nourse","sequence":"additional","affiliation":[{"name":"Accelrys, Incorporated, 2440 Camino Ramon, Suite 300, San Ramon, California 94583, United States"}]},{"given":"Keith T.","family":"Taylor","sequence":"additional","affiliation":[{"name":"Accelrys, Incorporated, 2440 Camino Ramon, Suite 300, San Ramon, California 94583, United States"}]}],"member":"316","published-online":{"date-parts":[[2011,8,22]]},"reference":[{"issue":"1","key":"ref1\/cit1","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1038\/nbt0110-1","volume":"28","year":"2010","journal-title":"Nat. Biotechnol."},{"issue":"10","key":"ref2\/cit2","doi-asserted-by":"crossref","first-page":"R104","DOI":"10.1186\/gb-2010-11-10-r104","volume":"11","author":"Sboner A.","year":"2010","journal-title":"Genome Biol."},{"key":"ref3\/cit3","doi-asserted-by":"crossref","first-page":"441","DOI":"10.1038\/nature08817","volume":"464","author":"Neumann H.","year":"2010","journal-title":"Nature"},{"key":"ref4\/cit4","doi-asserted-by":"crossref","first-page":"52","DOI":"10.1126\/science.1190719","volume":"329","author":"Gibson D. G.","year":"2010","journal-title":"Science"},{"key":"ref5\/cit5","first-page":"375","volume":"33","author":"Brown F.","year":"1998","journal-title":"Annu. Rep. Med. Chem."},{"key":"ref6\/cit6","doi-asserted-by":"crossref","first-page":"2230","DOI":"10.1021\/ci060016u","volume":"46","author":"Chen W. L.","year":"2006","journal-title":"J. Chem. Inf. Model."},{"key":"ref7\/cit7","first-page":"483","volume-title":"Computational Medicinal Chemistry and Drug Discovery","author":"Chen L.","year":"2004"},{"key":"ref8\/cit8","unstructured":"Taylor, K. T.Meeting the challenges of representing large, modified biopolymers.White paper;Symyx,San Ramon, CA;http:\/\/www.symyx.com\/products\/pdfs\/biopolymer_whitepaper.pdf(accessed July 11, 2011) ."},{"key":"ref9\/cit9","doi-asserted-by":"crossref","first-page":"2404","DOI":"10.1021\/ci800128b","volume":"48","author":"Jensen J. H.","year":"2008","journal-title":"J. Chem. Inf. Model."},{"key":"ref10\/cit10","unstructured":"Chen, W. L.Self-Contained Sequence Representation: A Proposal; Unpublished work;Elsevier MDL,San Ramon, CA, 2005."},{"key":"ref11\/cit11","unstructured":"Chen, W. L.The NEMA Algorithm for Stereochemistry Perception; Unpublished work;Elsevier MDL,San Ramon, CA, 2006."},{"key":"ref12\/cit12","doi-asserted-by":"crossref","first-page":"403","DOI":"10.1016\/S0022-2836(05)80360-2","volume":"215","author":"Altschul S. F.","year":"1990","journal-title":"J. Mol. Biol."},{"key":"ref13\/cit13","doi-asserted-by":"crossref","first-page":"244","DOI":"10.1021\/ci00007a012","volume":"32","author":"Dalby A.","year":"1992","journal-title":"J. Chem. Inf. Comput. Sci."},{"key":"ref14\/cit14","unstructured":"Symyx Direct bridges the gap between bioinformatics and cheminformatics, 2010.http:\/\/www.biovalley.com\/content.cfm?nav=6&content=19&command=details&id=14130(accessed June 30, 2011) .BioValley: The Life Sciences Network:Illkirch, France."},{"key":"ref15\/cit15","unstructured":"New Drawing Software From Accelrys Bridges Chemistry and Biology;Accelrys:San Diego, CA, 2010; http:\/\/ir.accelrys.com\/releasedetail.cfm?releaseid=537233(accessed June 30, 2011)."},{"key":"ref16\/cit16","unstructured":"Accelrys Draw\u2013 no fee;Accelrys:San Diego, CA;http:\/\/accelrys.com\/products\/informatics\/cheminformatics\/draw\/no-fee.php(accessed July 11, 2011) ."},{"key":"ref17\/cit17","unstructured":"CTfile Formats;Accelrys:San Diego, CA;http:\/\/accelrys.com\/products\/informatics\/cheminformatics\/ctfile-formats\/no-fee.php(accessed July 11, 2011) ."},{"key":"ref18\/cit18","unstructured":"NIST Secure Hashing;NIST:Gaithersburg, MD;http:\/\/csrc.nist.gov\/groups\/ST\/toolkit\/secure_hashing.html(accessed July 11, 2011) ."},{"key":"ref19\/cit19","unstructured":"Taylor, T. T.; Chen, W. L.NEMA key based exact match searching. White paper;Symyx Technologies Inc.:San Ramon, CA, 2008; http:\/\/www.symyx.com\/products\/pdfs\/nema_whitepaper.pdf(accessed July 11, 2011)."},{"key":"ref20\/cit20","unstructured":"The IUPAC International Chemical Identifier (InChITM);IUPAC:Research Triangle Park, NC;http:\/\/www.iupac.org\/inchi(accessed July 11, 2011) ."},{"key":"ref21\/cit21","unstructured":"InChIKey Collision: Two isomers of spongistatin: One InChIKey;The Goodman Group, University of Cambridge:Cambridge, U.K.;http:\/\/www-jmg.ch.cam.ac.uk\/data\/inchi(accessed July 12, 2011) ."},{"key":"ref22\/cit22","unstructured":"Release Notes of IUPAC International Chemical Identifier (InChI): InChI version 1, software version 1.03, 2010."},{"key":"ref23\/cit23","unstructured":"UniProt, release 2011_07;European Bioinformatics Institute, Swiss Institute of Bioinformatics, and Protein Information Resource (Georgetown University Medical Center:Hinxton, U.K., Lausanne, Switzerland, and Washington, D.C.;ftp:\/\/ftp.uniprot.org\/pub\/databases\/uniprot\/current_release\/relnotes.txt(accessed July 12, 2011) ."},{"key":"ref24\/cit24","doi-asserted-by":"crossref","first-page":"545","DOI":"10.1021\/ci00014a004","volume":"33","author":"Christie B. D.","year":"1993","journal-title":"J. Chem. Inf. Comput. Sci."},{"key":"ref25\/cit25","unstructured":"Ptmlist.txt.http:\/\/www.uniprot.org\/docs\/ptmlist(accessed July 11, 2011) ."},{"key":"ref26\/cit26","unstructured":"Ziegler, P.; Dittrich, K. R.Three Decades of Data Integration - All Problems Solved?In18th IFIP World Computer Congress (WCC 2004),Toulouse, France,August 22\u201327, 2004;WCC:Toulouse, France, 2004; Building the Information Society, vol12, pp3\u201312."},{"key":"ref27\/cit27","unstructured":"P63232(M2_I73A5) reviewed, UniProtKB\/Swiss-Prot;http:\/\/www.uniprot.org\/uniprot\/P63232(accessed June 30, 2011) ."},{"key":"ref28\/cit28","unstructured":"Q463X4(M2_I72A3) reviewed, UniProtKB\/Swiss-Prot;http:\/\/www.uniprot.org\/uniprot\/Q463X4(accessed June 30, 2011) ."},{"key":"ref29\/cit29","first-page":"151","volume-title":"Proceedings, Third Annual ACM Symposium on the Theory of Computing","author":"Cook S. A.","year":"1971"},{"key":"ref31\/cit31","unstructured":"P04007(RNS2_NICAL) reviewed, UniProtKB\/Swiss-Prot;http:\/\/www.uniprot.org\/uniprot\/P04007(accessed July 12, 2011) ."},{"key":"ref32\/cit32","unstructured":"PubChem Download Service;http:\/\/pubchem.ncbi.nlm.nih.gov\/\/pc_fetch\/pc_fetch.cgi(accessed July 11, 2011)"},{"key":"ref33\/cit33","doi-asserted-by":"crossref","first-page":"217","DOI":"10.1111\/j.1432-1033.1990.tb19446.x","volume":"194","author":"Weil H.-P.","year":"1990","journal-title":"Eur. J. Biochem."},{"key":"ref34\/cit34","doi-asserted-by":"crossref","first-page":"1298","DOI":"10.1021\/jm1012853","volume":"54","author":"Mangoni M. L.","year":"2011","journal-title":"J. Med. Chem."},{"key":"ref35\/cit35","first-page":"388","volume":"13","author":"Pihl T. D.","year":"2010","journal-title":"IDrugs"},{"key":"ref36\/cit36","doi-asserted-by":"crossref","first-page":"3497","DOI":"10.1093\/nar\/gkg500","volume":"31","author":"Chenna R.","year":"2003","journal-title":"Nucleic Acids Res."}],"container-title":["Journal of Chemical Information and Modeling"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/pubs.acs.org\/doi\/pdf\/10.1021\/ci2001988","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,4,15]],"date-time":"2023-04-15T09:46:21Z","timestamp":1681551981000},"score":1,"resource":{"primary":{"URL":"https:\/\/pubs.acs.org\/doi\/10.1021\/ci2001988"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2011,8,22]]},"references-count":35,"journal-issue":{"issue":"9","published-print":{"date-parts":[[2011,9,26]]}},"alternative-id":["10.1021\/ci2001988"],"URL":"https:\/\/doi.org\/10.1021\/ci2001988","relation":{},"ISSN":["1549-9596","1549-960X"],"issn-type":[{"value":"1549-9596","type":"print"},{"value":"1549-960X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2011,8,22]]}}}