{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T03:20:55Z","timestamp":1740108055416,"version":"3.37.3"},"reference-count":46,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2023,2,18]],"date-time":"2023-02-18T00:00:00Z","timestamp":1676678400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,2,18]],"date-time":"2023-02-18T00:00:00Z","timestamp":1676678400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Pattern Anal Applic"],"published-print":{"date-parts":[[2023,8]]},"DOI":"10.1007\/s10044-023-01141-3","type":"journal-article","created":{"date-parts":[[2023,2,19]],"date-time":"2023-02-19T10:24:42Z","timestamp":1676802282000},"page":"1161-1170","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Weighted edit distance optimized using genetic algorithm for SMILES-based compound similarity"],"prefix":"10.1007","volume":"26","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-4986-9757","authenticated-orcid":false,"given":"In-Hyuk","family":"Choi","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8823-0438","authenticated-orcid":false,"given":"Il-Seok","family":"Oh","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,2,18]]},"reference":[{"issue":"2","key":"1141_CR1","doi-asserted-by":"publisher","first-page":"337","DOI":"10.1006\/jmbi.1999.3371","volume":"295","author":"H Gohlke","year":"2000","unstructured":"Gohlke H, Hendlich M, Klebe G (2000) Knowledge-based scoring function to predict protein-ligand interactions. J Mol Biol 295(2):337\u2013356. https:\/\/doi.org\/10.1006\/jmbi.1999.3371","journal-title":"J Mol Biol"},{"issue":"18","key":"1141_CR2","doi-asserted-by":"publisher","first-page":"487","DOI":"10.1093\/bioinformatics\/bts412","volume":"28","author":"Y Tabei","year":"2012","unstructured":"Tabei Y, Pauwels E, Stoven V, Takemoto K, Yamanishi Y (2012) Identification of chemogenomic features from drug\u2013target interaction networks using interpretable classifiers. Bioinformatics 28(18):487\u2013494","journal-title":"Bioinformatics"},{"issue":"11\u201312","key":"1141_CR3","doi-asserted-by":"publisher","first-page":"719","DOI":"10.1002\/minf.201400066","volume":"33","author":"R Sawada","year":"2014","unstructured":"Sawada R, Kotera M, Yamanishi Y (2014) Benchmarking a wide range of chemical descriptors for drug-target interaction prediction using a chemogenomic approach. Mol Inf 33(11\u201312):719\u2013731","journal-title":"Mol Inf"},{"issue":"6","key":"1141_CR4","doi-asserted-by":"publisher","first-page":"983","DOI":"10.1021\/ci9800211","volume":"38","author":"P Willett","year":"1998","unstructured":"Willett P, Barnard JM, Downs GM (1998) Chemical similarity searching. J Chem Inf Comput Sci 38(6):983\u2013996","journal-title":"J Chem Inf Comput Sci"},{"issue":"2","key":"1141_CR5","doi-asserted-by":"publisher","first-page":"295","DOI":"10.1021\/ci990263g","volume":"40","author":"A Schuffenhauer","year":"2000","unstructured":"Schuffenhauer A, Gillet VJ, Willett P (2000) Similarity searching in files of three-dimensional chemical structures: analysis of the bioster database using two-dimensional fingerprints and molecular field descriptors. J Chem Inf Comput Sci 40(2):295\u2013307","journal-title":"J Chem Inf Comput Sci"},{"issue":"18","key":"1141_CR6","doi-asserted-by":"publisher","first-page":"1628","DOI":"10.2174\/156802608786786598","volume":"8","author":"AM Helguera","year":"2008","unstructured":"Helguera AM, Combes RD, Gonz\u00e1lez MP, Cordeiro M (2008) Applications of 2d descriptors in drug design: a dragon tale. Curr Top Med Chem 8(18):1628\u20131655","journal-title":"Curr Top Med Chem"},{"issue":"7","key":"1141_CR7","doi-asserted-by":"publisher","first-page":"1337","DOI":"10.1021\/ci800038f","volume":"48","author":"H Hong","year":"2008","unstructured":"Hong H, Xie Q, Ge W, Qian F, Fang H, Shi L, Su Z, Perkins R, Tong W (2008) Mold2, molecular descriptors from 2d structures for chemoinformatics and toxicoinformatics. J Chem Inf Model 48(7):1337\u20131344","journal-title":"J Chem Inf Model"},{"issue":"2","key":"1141_CR8","doi-asserted-by":"publisher","first-page":"327","DOI":"10.1021\/ci300445e","volume":"53","author":"DC Kombo","year":"2013","unstructured":"Kombo DC, Tallapragada K, Jain R, Chewning J, Mazurov AA, Speake JD, Hauser TA, Toler S (2013) 3d molecular descriptors important for clinical success. J Chem Inf Model 53(2):327\u2013342","journal-title":"J Chem Inf Model"},{"issue":"1","key":"1141_CR9","doi-asserted-by":"publisher","first-page":"31","DOI":"10.1021\/ci00057a005","volume":"28","author":"D Weininger","year":"1998","unstructured":"Weininger D (1998) Smiles, a chemical language and information system. 1. Introduction to methodology and encoding rules. J Chem Inf Comput Sci 28(1):31\u201336. https:\/\/doi.org\/10.1021\/ci00057a005","journal-title":"J Chem Inf Comput Sci"},{"issue":"2","key":"1141_CR10","doi-asserted-by":"publisher","first-page":"97","DOI":"10.1021\/ci00062a008","volume":"29","author":"D Weininger","year":"1989","unstructured":"Weininger D, Weininger A, Weininger JL (1989) Smiles. 2. Algorithm for generation of unique smiles notation. J Chem Inf Comput Sci 29(2):97\u2013101. https:\/\/doi.org\/10.1021\/ci00062a008","journal-title":"J Chem Inf Comput Sci"},{"key":"1141_CR11","doi-asserted-by":"publisher","DOI":"10.1186\/s12859-016-0977-x","author":"H \u00d6zt\u00fcrk","year":"2016","unstructured":"\u00d6zt\u00fcrk H, Ozkirimli E, \u00d6zg\u00fcr A (2016) A comparative study of SMILES-based compound similarity functions for drug-target interaction prediction. BMC Bioinform. https:\/\/doi.org\/10.1186\/s12859-016-0977-x","journal-title":"BMC Bioinform"},{"issue":"8","key":"1141_CR12","first-page":"707","volume":"10","author":"VI Levenshtein","year":"1996","unstructured":"Levenshtein VI (1996) Binary codes capable of correcting deletions, insertions, and reversals. Sov Phys Doklady 10(8):707\u2013710","journal-title":"Sov Phys Doklady"},{"issue":"2","key":"1141_CR13","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/1376815.1376819","volume":"2","author":"A Islam","year":"2008","unstructured":"Islam A, Inkpen D (2008) Semantic text similarity using corpus-based word similarity and string similarity. ACM Trans Knowl Discov Data 2(2):1\u201325","journal-title":"ACM Trans Knowl Discov Data"},{"issue":"1\u20132","key":"1141_CR14","doi-asserted-by":"publisher","first-page":"141","DOI":"10.1080\/1062936X.2011.645874","volume":"23","author":"DS Cao","year":"2012","unstructured":"Cao DS, Zhao JC, Yang YN, Zhao CX, Yan J, Liu S, Hu QN, Xu QS, Liang YZ (2012) In silico toxicity prediction by support vector machine and smiles representation-based string kernel. SAR QSAR Environ Res 23(1\u20132):141\u2013153","journal-title":"SAR QSAR Environ Res"},{"issue":"8","key":"1141_CR15","doi-asserted-by":"publisher","first-page":"1979","DOI":"10.1021\/ci400206h","volume":"53","author":"J Schwartz","year":"2013","unstructured":"Schwartz J, Awale M, Reymond JL (2013) Smifp (smiles fingerprint) chemical space for virtual screening and visualization of large databases of organic molecules. J Chem Inf Model 53(8):1979\u20131989. https:\/\/doi.org\/10.1021\/ci400206h","journal-title":"J Chem Inf Model"},{"key":"1141_CR16","volume-title":"An adventure in non-euclidean geometry","author":"EF Krause","year":"1986","unstructured":"Krause EF (1986) An adventure in non-euclidean geometry. Dover Publication, New York"},{"key":"1141_CR17","doi-asserted-by":"publisher","DOI":"10.1021\/ci0496797","author":"D Vidal","year":"2005","unstructured":"Vidal D, Thormann M, Pons M (2005) LINGO, an efficient holographic text based method to calculate biophysical properties and intermolecular similarities. J Chem Inf Model. https:\/\/doi.org\/10.1021\/ci0496797","journal-title":"J Chem Inf Model"},{"issue":"4","key":"1141_CR18","doi-asserted-by":"publisher","first-page":"309","DOI":"10.1147\/rd.14.0309","volume":"1","author":"HP Luhn","year":"1957","unstructured":"Luhn HP (1957) A statistical approach to mechanized encoding and searching of literary information. IBM J Res Dev 1(4):309\u2013317. https:\/\/doi.org\/10.1147\/rd.14.0309","journal-title":"IBM J Res Dev"},{"key":"1141_CR19","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1108\/eb026526","volume":"28","author":"KS Jones","year":"1972","unstructured":"Jones KS (1972) A statistical interpretation of term specificity and its application in retrieval. J Doc 28:11\u201321","journal-title":"J Doc"},{"key":"1141_CR20","doi-asserted-by":"publisher","DOI":"10.1093\/bib\/bbz157","author":"M Bagherian","year":"2020","unstructured":"Bagherian M, Sabeti E, Wang K et al (2020) Machine learning approaches and databases for prediction of drug\u2013target interaction: a survey paper. Brief Bioinform. https:\/\/doi.org\/10.1093\/bib\/bbz157","journal-title":"Brief Bioinform"},{"key":"1141_CR21","doi-asserted-by":"publisher","DOI":"10.1016\/j.jbi.2019.103159","author":"K Sachdev","year":"2019","unstructured":"Sachdev K, Gupta MK (2019) A comprehensive review of feature based methods for drug target interaction prediction. J Biomed Inform. https:\/\/doi.org\/10.1016\/j.jbi.2019.103159","journal-title":"J Biomed Inform"},{"key":"1141_CR22","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btz111","author":"M Karimi","year":"2019","unstructured":"Karimi M, Wu D, Wang Z et al (2019) DeepAffinity: interpretable deep learning of compound\u2013protein affinity through unified recurrent and convolutional neural networks. Bioinformatics. https:\/\/doi.org\/10.1093\/bioinformatics\/btz111","journal-title":"Bioinformatics"},{"issue":"6","key":"1141_CR23","doi-asserted-by":"publisher","first-page":"e100719","DOI":"10.1371\/journal.pcbi.1007129","volume":"15","author":"I Lee","year":"2019","unstructured":"Lee I, Keum J, Nam H (2019) DeepConv-DTI: prediction of drug-target interactions via deep learning with convolution on protein sequences. PLoS Comput Biol 15(6):e100719. https:\/\/doi.org\/10.1371\/journal.pcbi.1007129","journal-title":"PLoS Comput Biol"},{"key":"1141_CR24","doi-asserted-by":"publisher","DOI":"10.1021\/acs.jcim.9b00387","author":"J Lim","year":"2019","unstructured":"Lim J, Ryu S, Park K et al (2019) Predicting drug\u2013target interaction using a novel graph neural network with 3D structure-embedded graph representation. J Chem Inf Model. https:\/\/doi.org\/10.1021\/acs.jcim.9b00387","journal-title":"J Chem Inf Model"},{"key":"1141_CR25","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btaa880","author":"K Huang","year":"2020","unstructured":"Huang K, Xiao C, Glass LM et al (2020) MolTrans: molecular Interaction Transformer for drug\u2013target interaction prediction. Bioinformatics. https:\/\/doi.org\/10.1093\/bioinformatics\/btaa880","journal-title":"Bioinformatics"},{"key":"1141_CR26","doi-asserted-by":"publisher","DOI":"10.2174\/0929867326666190808154841","author":"C Wang","year":"2020","unstructured":"Wang C, Kurgan L (2020) Survey of similarity-based prediction of drug-protein interactions. Curr Med Chem. https:\/\/doi.org\/10.2174\/0929867326666190808154841","journal-title":"Curr Med Chem"},{"issue":"13","key":"1141_CR27","doi-asserted-by":"publisher","first-page":"232","DOI":"10.1093\/bioinformatics\/btn162","volume":"24","author":"Y Yamanishi","year":"2008","unstructured":"Yamanishi Y, Araki M, Gutteridge A, Honda W, Kanehisa M (2008) Prediction of drug-target interaction networks from the integration of chemical and genomic spaces. Bioinformatics 24(13):232\u2013240. https:\/\/doi.org\/10.1093\/bioinformatics\/btn162","journal-title":"Bioinformatics"},{"key":"1141_CR28","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btp433","author":"K Bleakley","year":"2009","unstructured":"Bleakley K, Yamanishi Y (2009) Supervised prediction of drug\u2013target interactions using bipartite local models. Bioinformatics. https:\/\/doi.org\/10.1093\/bioinformatics\/btp433","journal-title":"Bioinformatics"},{"key":"1141_CR29","doi-asserted-by":"publisher","DOI":"10.1093\/bib\/bbab275","author":"Q An","year":"2021","unstructured":"An Q, Yu L (2021) A heterogeneous network embedding framework for predicting similarity-based drug-target interactions. Brief Bioinform. https:\/\/doi.org\/10.1093\/bib\/bbab275","journal-title":"Brief Bioinform"},{"key":"1141_CR30","doi-asserted-by":"publisher","unstructured":"Zheng X, Ding H, Mamitsuka H et al (2013) Collaborative matrix factorization with multiple similarities for predicting drug-target. https:\/\/doi.org\/10.1145\/2487575.2487670","DOI":"10.1145\/2487575.2487670"},{"key":"1141_CR31","doi-asserted-by":"publisher","DOI":"10.1109\/TCBB.2016.2530062","author":"A Ezzat","year":"2017","unstructured":"Ezzat A, Zhao P, Wu M et al (2017) Drug\u2013target interaction prediction with graph regularized matrix factorization. IEEE\/ACM Trans Comput Biol Bioinform. https:\/\/doi.org\/10.1109\/TCBB.2016.2530062","journal-title":"IEEE\/ACM Trans Comput Biol Bioinform"},{"key":"1141_CR32","doi-asserted-by":"publisher","DOI":"10.1016\/j.jcmds.2022.100044","author":"P V\u00e4th","year":"2022","unstructured":"V\u00e4th P, M\u00fcnch M, Raab C et al (2022) PROVAL: a framework for comparison of protein sequence embeddings. J Comput Math Data Sci. https:\/\/doi.org\/10.1016\/j.jcmds.2022.100044","journal-title":"J Comput Math Data Sci"},{"key":"1141_CR33","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.1967.1053964","author":"T Cover","year":"1967","unstructured":"Cover T, Hart P (1967) Nearest neighbor pattern classification. IEEE Trans Inf Theory. https:\/\/doi.org\/10.1109\/TIT.1967.1053964","journal-title":"IEEE Trans Inf Theory"},{"key":"1141_CR34","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.1982.1056489","author":"S Lloyd","year":"1982","unstructured":"Lloyd S (1982) Least squares quantization in PCM. IEEE Trans Inf Theory. https:\/\/doi.org\/10.1109\/TIT.1982.1056489","journal-title":"IEEE Trans Inf Theory"},{"key":"1141_CR35","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0059401","author":"M Biehl","year":"2013","unstructured":"Biehl M, Bunte K, Schneider P (2013) Analysis of flow cytometry data by matrix relevance learning vector quantization. PLoS ONE. https:\/\/doi.org\/10.1371\/journal.pone.0059401","journal-title":"PLoS ONE"},{"key":"1141_CR36","doi-asserted-by":"publisher","DOI":"10.1016\/j.neunet.2011.12.003","author":"S Kirstein","year":"2012","unstructured":"Kirstein S, Wersing H, Gross H-M et al (2012) A life-long learning vector quantization approach for interactive learning of multiple categories. Neural Netw. https:\/\/doi.org\/10.1016\/j.neunet.2011.12.003","journal-title":"Neural Netw"},{"key":"1141_CR37","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2013.09.048","author":"A Backhaus","year":"2014","unstructured":"Backhaus A, Seiffert U (2014) Classification in high-dimensional spectral data: accuracy vs. interpretability vs. model size. Neurocomputing. https:\/\/doi.org\/10.1016\/j.neucom.2013.09.048","journal-title":"Neurocomputing"},{"key":"1141_CR38","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2013.05.054","author":"B Hammer","year":"2014","unstructured":"Hammer B, Hofmann D, Schleif F-M et al (2014) Learning vector quantization for (dis-)similarities. Neurocomputing. https:\/\/doi.org\/10.1016\/j.neucom.2013.05.054","journal-title":"Neurocomputing"},{"key":"1141_CR39","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2014.11.082","author":"B Mokbel","year":"2015","unstructured":"Mokbel B, Paassen B, Schleif F-M et al (2015) Metric learning for sequences in relational LVQ. Neurocomputing. https:\/\/doi.org\/10.1016\/j.neucom.2014.11.082","journal-title":"Neurocomputing"},{"key":"1141_CR40","doi-asserted-by":"publisher","unstructured":"Zhang S, Hu Y, Bian G (2017) Research on string similarity algorithm based on Levenshtein Distance. https:\/\/doi.org\/10.1109\/IAEAC.2017.8054419","DOI":"10.1109\/IAEAC.2017.8054419"},{"key":"1141_CR41","unstructured":"Mikolov T, Chen K, Corrado G et al (2013) Efficient estimation of word representations in vector space. https:\/\/arxiv.org\/abs\/1301.3781"},{"key":"1141_CR42","doi-asserted-by":"publisher","DOI":"10.1186\/s13321-021-00552-w","author":"MA Thafar","year":"2021","unstructured":"Thafar MA, Olayan RS, Albaradei S et al (2021) DTi2Vec: drug\u2013target interaction prediction using network embedding and ensemble learning. J Cheminform. https:\/\/doi.org\/10.1186\/s13321-021-00552-w","journal-title":"J Cheminform"},{"key":"1141_CR43","volume-title":"Cormen, introduction algorithms","author":"H Thomas","year":"2009","unstructured":"Thomas H (2009) Cormen, introduction algorithms, 3rd edn. MIT Press, Cambridge","edition":"3"},{"issue":"6","key":"1141_CR44","doi-asserted-by":"publisher","first-page":"66952","DOI":"10.1371\/journal.pone.0066952","volume":"8","author":"T van Laarhoven","year":"2013","unstructured":"van Laarhoven T, Marchiori E (2013) Predicting drug-target interactions for new drug compounds using a weighted nearest neighbor profile. PLoS ONE 8(6):66952. https:\/\/doi.org\/10.1371\/journal.pone.0066952","journal-title":"PLoS ONE"},{"key":"1141_CR45","unstructured":"Ruder S (2016) An overview of gradient descent optimization algorithms. https:\/\/arxiv.org\/abs\/1609.04747"},{"key":"1141_CR46","doi-asserted-by":"publisher","DOI":"10.1007\/s11042-020-10139-6","author":"S Katoch","year":"2020","unstructured":"Katoch S, Chauhan SS, Kumar V (2020) A review on genetic algorithm: past, present, and future. Multimed Tools Appl. https:\/\/doi.org\/10.1007\/s11042-020-10139-6","journal-title":"Multimed Tools Appl"}],"container-title":["Pattern Analysis and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10044-023-01141-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10044-023-01141-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10044-023-01141-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,7,22]],"date-time":"2023-07-22T14:02:09Z","timestamp":1690034529000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10044-023-01141-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,2,18]]},"references-count":46,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2023,8]]}},"alternative-id":["1141"],"URL":"https:\/\/doi.org\/10.1007\/s10044-023-01141-3","relation":{},"ISSN":["1433-7541","1433-755X"],"issn-type":[{"type":"print","value":"1433-7541"},{"type":"electronic","value":"1433-755X"}],"subject":[],"published":{"date-parts":[[2023,2,18]]},"assertion":[{"value":"13 April 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"24 January 2023","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 February 2023","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors did not receive support from any organization for the submitted work. And all authors certify that they have no affiliations with or involvement in any organization or entity with any financial interest or non-financial interest in the subject matter or materials discussed in this manuscript.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}