{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,26]],"date-time":"2025-06-26T09:32:01Z","timestamp":1750930321293,"version":"3.37.3"},"reference-count":60,"publisher":"American Chemical Society (ACS)","issue":"4","license":[{"start":{"date-parts":[[2021,3,22]],"date-time":"2021-03-22T00:00:00Z","timestamp":1616371200000},"content-version":"unspecified","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0\/"}],"funder":[{"DOI":"10.13039\/100000054","name":"National Cancer Institute","doi-asserted-by":"publisher","award":["HHSN261200800001E"],"award-info":[{"award-number":["HHSN261200800001E"]}],"id":[{"id":"10.13039\/100000054","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000049","name":"National Institute on Aging","doi-asserted-by":"publisher","award":["R01AD057555"],"award-info":[{"award-number":["R01AD057555"]}],"id":[{"id":"10.13039\/100000049","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000057","name":"National Institute of General Medical Sciences","doi-asserted-by":"publisher","award":["R01GM122845"],"award-info":[{"award-number":["R01GM122845"]}],"id":[{"id":"10.13039\/100000057","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["J. Chem. Inf. Model."],"published-print":{"date-parts":[[2021,4,26]]},"DOI":"10.1021\/acs.jcim.0c01285","type":"journal-article","created":{"date-parts":[[2021,3,24]],"date-time":"2021-03-24T00:12:37Z","timestamp":1616544757000},"page":"1570-1582","source":"Crossref","is-referenced-by-count":24,"title":["MSA-Regularized Protein Sequence Transformer toward Predicting Genome-Wide Chemical-Protein Interactions: Application to GPCRome Deorphanization"],"prefix":"10.1021","volume":"61","author":[{"given":"Tian","family":"Cai","sequence":"first","affiliation":[{"name":"Ph.D. Program in Computer Science, The Graduate Center, The City University of New York, New York, New York 10016, United States"}]},{"given":"Hansaim","family":"Lim","sequence":"additional","affiliation":[{"name":"Ph.D. Program in Biochemistry, The Graduate Center, The City University of New York, New York, New York 10016, United States"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9020-301X","authenticated-orcid":true,"given":"Kyra Alyssa","family":"Abbu","sequence":"additional","affiliation":[{"name":"Department of Computer Science, Hunter College, The City University of New York, New York, New York 10065, United States"}]},{"given":"Yue","family":"Qiu","sequence":"additional","affiliation":[{"name":"Ph.D. Program in Biology, The Graduate Center, The City University of New York, New York, New York 10016, United States"}]},{"given":"Ruth","family":"Nussinov","sequence":"additional","affiliation":[{"name":"Computational Structural Biology Section, Basic Science Program, Frederick National Laboratory for Cancer Research, Frederick, Maryland 21702, United States"},{"name":"Department of Human Molecular Genetics and Biochemistry, Sackler School of Medicine, Tel Aviv University, Tel Aviv 69978, Israel"}]},{"given":"Lei","family":"Xie","sequence":"additional","affiliation":[{"name":"Ph.D. Program in Computer Science, The Graduate Center, The City University of New York, New York, New York 10016, United States"},{"name":"Ph.D. Program in Biochemistry, The Graduate Center, The City University of New York, New York, New York 10016, United States"},{"name":"Department of Computer Science, Hunter College, The City University of New York, New York, New York 10065, United States"},{"name":"Ph.D. Program in Biology, The Graduate Center, The City University of New York, New York, New York 10016, United States"},{"name":"Helen and Robert Appel Alzheimer\u2019s Disease Research Institute, Feil Family Brain & Mind Research Institute, Weill Cornell Medicine, Cornell University, New York, New York 10021, United States"}]}],"member":"316","published-online":{"date-parts":[[2021,3,23]]},"reference":[{"key":"ref1\/cit1","doi-asserted-by":"publisher","DOI":"10.1007\/s00335-019-09809-0"},{"key":"ref2\/cit2","doi-asserted-by":"publisher","DOI":"10.1038\/nrd.2017.252"},{"key":"ref3\/cit3","doi-asserted-by":"publisher","DOI":"10.1016\/j.bcp.2018.02.016"},{"key":"ref4\/cit4","doi-asserted-by":"publisher","DOI":"10.1111\/bph.13452"},{"key":"ref5\/cit5","doi-asserted-by":"publisher","DOI":"10.1038\/s42256-020-0152-y"},{"key":"ref6\/cit6","doi-asserted-by":"publisher","DOI":"10.1093\/nar\/gku973"},{"key":"ref7\/cit7","doi-asserted-by":"publisher","DOI":"10.1109\/TCBB.2016.2570211"},{"key":"ref8\/cit8","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pcbi.1005135"},{"key":"ref9\/cit9","doi-asserted-by":"publisher","DOI":"10.1038\/srep38860"},{"key":"ref10\/cit10","doi-asserted-by":"publisher","DOI":"10.1021\/acs.jproteome.6b00618"},{"key":"ref11\/cit11","first-page":"3371","volume-title":"Proceedings of the Twenty-Seventh International Joint Conference on Artificial Intelligence, IJCAI-18","author":"Gao K. Y.","year":"2018"},{"key":"ref12\/cit12","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btaa921"},{"key":"ref13\/cit13","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pcbi.1007129"},{"key":"ref14\/cit14","unstructured":"Sutskever, I.; Vinyals, O.; Le, Q. Sequence to Sequence Learning with Neural Networks, 2014; pp 10; https:\/\/arxiv.org\/abs\/1409.3215v3."},{"key":"ref15\/cit15","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btz111"},{"key":"ref16\/cit16","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btaa524"},{"key":"ref17\/cit17","unstructured":"Lan, Z.; Chen, M.; Goodman, S.; Gimpel, K.; Sharma, P.; Soricut, R. ALBERT: A Lite BERT for Self-supervised Learning of Language Representations, 2019; https:\/\/arxiv.org\/abs\/1909.11942."},{"key":"ref18\/cit18","doi-asserted-by":"crossref","unstructured":"Rao, R.; Bhattacharya, N.; Thomas, N.; Duan, Y.; Chen, X.; Canny, J. F.; Abbeel, P.; Song, Y. S.Evaluating Protein Transfer Learning with TAPE.  CoRR, abs\/1906.08230, 2019.","DOI":"10.1101\/676825"},{"key":"ref19\/cit19","unstructured":"Bepler, T.; Berger, B. Learning protein sequence embeddings using information from structure CoRR, abs\/1902.08661, 2019."},{"key":"ref20\/cit20","unstructured":"Min, S.; Park, S.; Kim, S.; Choi, H. S.; Yoon, S. Pre-Training of Deep Bidirectional Protein Sequence Representations with Structural Information, 2019; https:\/\/arxiv.org\/abs\/1912.05625."},{"key":"ref21\/cit21","doi-asserted-by":"publisher","DOI":"10.1038\/nrd.2017.178"},{"key":"ref22\/cit22","doi-asserted-by":"publisher","DOI":"10.1093\/nar\/gky995"},{"key":"ref23\/cit23","doi-asserted-by":"publisher","DOI":"10.1093\/nar\/gkr777"},{"key":"ref24\/cit24","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/18.1.130"},{"key":"ref25\/cit25","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btv302"},{"key":"ref26\/cit26","doi-asserted-by":"publisher","DOI":"10.1093\/nar\/gkj067"},{"key":"ref27\/cit27","unstructured":"Duvenaud, D.; Maclaurin, D.; Iparraguirre, J.; Bombarell, R.; Hirzel, T.; Aspuru-Guzik, A.; Adams, R. Convolutional Networks on Graphs for Learning Molecular Fingerprints, 2015; pp 2224\u20132232 https:\/\/arxiv.org\/abs\/1509.09292."},{"key":"ref28\/cit28","unstructured":"dos Santos, C. N.; Tan, M.; Xiang, B.; Zhou, B. Attentive Pooling Networks CoRR, abs\/1602.03609, 2016."},{"key":"ref29\/cit29","first-page":"4171","volume-title":"Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Vol. 1 (Long and Short Papers)","author":"Devlin K.","year":"2019"},{"key":"ref30\/cit30","unstructured":"Lundberg, S.; Lee, S.I. A Unified Approach to Interpreting Model Predictions, 2017; https:\/\/arxiv.org\/abs\/1705.07874."},{"key":"ref31\/cit31","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.0435715100"},{"key":"ref32\/cit32","doi-asserted-by":"publisher","DOI":"10.2174\/092986712799320556"},{"key":"ref33\/cit33","doi-asserted-by":"publisher","DOI":"10.1038\/s41594-017-0011-7"},{"key":"ref34\/cit34","doi-asserted-by":"publisher","DOI":"10.1016\/j.mce.2016.11.023"},{"key":"ref35\/cit35","doi-asserted-by":"publisher","DOI":"10.1016\/j.tips.2010.10.001"},{"key":"ref36\/cit36","doi-asserted-by":"publisher","DOI":"10.1016\/j.bcp.2013.03.005"},{"key":"ref37\/cit37","doi-asserted-by":"publisher","DOI":"10.1021\/ja508394x"},{"key":"ref38\/cit38","doi-asserted-by":"publisher","DOI":"10.1111\/nyas.14192"},{"key":"ref39\/cit39","doi-asserted-by":"crossref","unstructured":"Rives, A.; Goyal, S.; Meier, J.; Guo, D.; Ott, M.; Zitnick, C.; Ma, J.; Fergus, R. Biological Structure and Function Emerge from Scaling Unsupervised Learning to 250 Million Protein Sequences.  bioRxiv  622803, 2019.","DOI":"10.1101\/622803"},{"key":"ref40\/cit40","doi-asserted-by":"crossref","unstructured":"He, K.; Zhang, X.; Ren, S.; Sun, J. Deep Residual Learning for Image Recognition CoRR, abs\/1512.03385, 2015.","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref41\/cit41","unstructured":"Duvenaud, D.; Maclaurin, D.; Iparraguirre, J.; Bombarell, R.; Hirzel, T.; Aspuru-Guzik, A.; Adams, R. Convolutional Networks on Graphs for Learning Molecular Fingerprints, 2015, pp 2224\u20132232; https:\/\/arxiv.org\/abs\/1509.09292."},{"key":"ref42\/cit42","unstructured":"Howard, J.; Ruder, S. Universal Language Model Fine-tuning for Text Classification, 2018; pp 328\u2013339; https:\/\/arxiv.org\/abs\/1801.06146."},{"key":"ref43\/cit43","unstructured":"Vaswani, A.; Shazeer, N.; Parmar, N.; Uszkoreit, J.; Jones, L.; Gomez, A.; Kaiser, L.; Polosukhin, I. Attention Is All You Need, 2017; https:\/\/arxiv.org\/abs\/1706.03762."},{"key":"ref44\/cit44","doi-asserted-by":"publisher","DOI":"10.1007\/s10462-020-09838-1"},{"key":"ref45\/cit45","doi-asserted-by":"publisher","DOI":"10.1093\/nar\/25.17.3389"},{"key":"ref46\/cit46","unstructured":"Kohavi, R. A Study of Cross-Validation and Bootstrap for Accuracy Estimation and Model Selection. Morgan Kaufmann, 1995; pp 1137\u20131143; https:\/\/dl.acm.org\/doi\/10.5555\/1643031.1643047."},{"key":"ref47\/cit47","first-page":"1","volume-title":"2017 IEEE International Conference on INnovations in Intelligent SysTems and Applications (INISTA)","author":"Leon F.","year":"2017"},{"key":"ref48\/cit48","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/bty633"},{"key":"ref49\/cit49","doi-asserted-by":"publisher","DOI":"10.1093\/molbev\/msz240"},{"key":"ref50\/cit50","doi-asserted-by":"publisher","DOI":"10.1111\/2041-210X.12628"},{"key":"ref51\/cit51","doi-asserted-by":"publisher","DOI":"10.1093\/molbev\/msy194"},{"key":"ref52\/cit52","unstructured":"Bahdanau, D.; Cho, K.; Bengio, Y. Neural Machine Translation by Jointly Learning to Align and Translate, 2014; https:\/\/arxiv.org\/abs\/1409.0473."},{"key":"ref53\/cit53","unstructured":"Liu, Y.; Ott, M.; Goyal, N.; Du, J.; Joshi, M.; Chen, D.; Levy, O.; Lewis, M.; Zettlemoyer, L.; Stoyanov, V. RoBERTa: A Robustly Optimized BERT Pretraining Approach, 2019; https:\/\/arxiv.org\/abs\/1907.11692."},{"key":"ref54\/cit54","doi-asserted-by":"crossref","unstructured":"Elnaggar, A.; Heinzinger, M.; Dallago, C.; Rihawi, G.; Wang, Y.; Jones, L.; Gibbs, T.; Feher, T.; Angerer, C.; Steinegger, M.; Bhowmik, D.; Rost, B. ProtTrans: Towards Cracking the Language of Life\u2019s Code Through Self-Supervised Deep Learning and High Performance Computing, 2020; https:\/\/arxiv.org\/abs\/2007.06225.","DOI":"10.1101\/2020.07.12.199554"},{"key":"ref55\/cit55","doi-asserted-by":"publisher","DOI":"10.1101\/622803"},{"key":"ref56\/cit56","doi-asserted-by":"crossref","unstructured":"Rao, R.; Bhattacharya, N.; Thomas, N.; Duan, Y.; Chen, X.; Canny, J.; Abbeel, P.; Song, Y. S. Evaluating Protein Transfer Learning with TAPE, 2019; https:\/\/arxiv.org\/abs\/1906.08230.","DOI":"10.1101\/676825"},{"key":"ref57\/cit57","doi-asserted-by":"publisher","DOI":"10.1093\/nar\/gkaa1080"},{"key":"ref58\/cit58","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btaa524"},{"key":"ref59\/cit59","doi-asserted-by":"publisher","DOI":"10.1101\/676825"},{"key":"ref60\/cit60","doi-asserted-by":"publisher","DOI":"10.1016\/j.compbiolchem.2019.107140"}],"container-title":["Journal of Chemical Information and Modeling"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/pubs.acs.org\/doi\/pdf\/10.1021\/acs.jcim.0c01285","content-type":"application\/pdf","content-version":"vor","intended-application":"unspecified"},{"URL":"https:\/\/pubs.acs.org\/doi\/pdf\/10.1021\/acs.jcim.0c01285","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,4,27]],"date-time":"2023-04-27T08:31:11Z","timestamp":1682584271000},"score":1,"resource":{"primary":{"URL":"https:\/\/pubs.acs.org\/doi\/10.1021\/acs.jcim.0c01285"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,3,23]]},"references-count":60,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2021,4,26]]}},"alternative-id":["10.1021\/acs.jcim.0c01285"],"URL":"https:\/\/doi.org\/10.1021\/acs.jcim.0c01285","relation":{},"ISSN":["1549-9596","1549-960X"],"issn-type":[{"type":"print","value":"1549-9596"},{"type":"electronic","value":"1549-960X"}],"subject":[],"published":{"date-parts":[[2021,3,23]]}}}