{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,11]],"date-time":"2025-09-11T19:18:18Z","timestamp":1757618298670,"version":"3.44.0"},"reference-count":57,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2025,6,10]],"date-time":"2025-06-10T00:00:00Z","timestamp":1749513600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,6,10]],"date-time":"2025-06-10T00:00:00Z","timestamp":1749513600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Science Foundation of China","doi-asserted-by":"crossref","award":["61972066"],"award-info":[{"award-number":["61972066"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Data Min Knowl Disc"],"published-print":{"date-parts":[[2025,7]]},"DOI":"10.1007\/s10618-025-01113-7","type":"journal-article","created":{"date-parts":[[2025,6,10]],"date-time":"2025-06-10T09:45:21Z","timestamp":1749548721000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Hamming encoder: mining discriminative k-mers for discrete sequence classification"],"prefix":"10.1007","volume":"39","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8267-9181","authenticated-orcid":false,"given":"Dong","family":"Junjie","sequence":"first","affiliation":[]},{"given":"Jiang","family":"Mudi","sequence":"additional","affiliation":[]},{"given":"Hu","family":"Lianyu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9526-8816","authenticated-orcid":false,"given":"He","family":"Zengyou","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,6,10]]},"reference":[{"key":"1113_CR1","unstructured":"Anticancer peptides (2019) UCI Machine Learning Repository. https:\/\/archive.ics.uci.edu\/dataset\/589\/anticancer+peptides"},{"key":"1113_CR2","unstructured":"Bengio Y, L\u00e9onard N, Courville A (2013) Estimating or propagating gradients through stochastic neurons for conditional computation. arXiv preprint arXiv:1308.3432"},{"key":"1113_CR3","doi-asserted-by":"crossref","unstructured":"Bulat A, Martinez B, Tzimiropoulos G (2020) Bats: binary architecture search. In: Proceedings of the 2020 European conference on computer vision, Springer, pp 309\u2013325.","DOI":"10.1007\/978-3-030-58592-1_19"},{"key":"1113_CR4","unstructured":"Bulat A, Tzimiropoulos G (2019) Xnor-net++: improved binary neural networks. arXiv preprint arXiv:1909.13863"},{"key":"1113_CR5","unstructured":"Chen S, Wang W, Pan SJ (2019) Metaquant: learning to quantize by learning to penetrate non-differentiable quantization. In: Proceedings of the 33rd international conference on neural information processing systems, pp 3916\u20133926"},{"issue":"2","key":"1113_CR6","doi-asserted-by":"publisher","first-page":"139","DOI":"10.1093\/bioinformatics\/14.2.139","volume":"14","author":"NA Chuzhanova","year":"1998","unstructured":"Chuzhanova NA, Jones AJ, Margetts S (1998) Feature selection for genetic sequence classification. Bioinformatics 14(2):139\u2013143","journal-title":"Bioinformatics"},{"key":"1113_CR7","unstructured":"Collery M, Bonnard P, Fages F, Kusters R (2023) Neural-based classification rule learning for sequential data. In: Proceedings of the 11th international conference on learning representations"},{"issue":"6","key":"1113_CR8","doi-asserted-by":"publisher","first-page":"1130","DOI":"10.1109\/TKDE.2019.2897311","volume":"32","author":"J De Smedt","year":"2020","unstructured":"De Smedt J, Deeva G, De Weerdt J (2020) Mining behavioral sequence constraints for classification. IEEE Trans Knowl Data Eng 32(6):1130\u20131142","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"1113_CR9","first-page":"1","volume":"7","author":"J Dem\u0161ar","year":"2006","unstructured":"Dem\u0161ar J (2006) Statistical comparisons of classifiers over multiple data sets. J Mach Learn Res 7:1\u201330","journal-title":"J Mach Learn Res"},{"key":"1113_CR10","doi-asserted-by":"crossref","unstructured":"Di\u00a0Ciccio C, Mecella M (2013) A two-step fast algorithm for the automated discovery of declarative workflows. In: Proceedings of the 2013 IEEE symposium on computational intelligence and data mining (CIDM), IEEE, pp 135\u2013142","DOI":"10.1109\/CIDM.2013.6597228"},{"issue":"1","key":"1113_CR11","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1007\/s10115-016-1002-4","volume":"52","author":"E Egho","year":"2017","unstructured":"Egho E, Gay D, Boull\u00e9 M, Voisine N, Cl\u00e9rot F (2017) A user parameter-free approach for mining robust sequential classification rules. Knowl Inf Syst 52(1):53\u201381","journal-title":"Knowl Inf Syst"},{"issue":"3","key":"1113_CR12","doi-asserted-by":"publisher","first-page":"467","DOI":"10.1016\/j.datak.2008.05.007","volume":"66","author":"TP Exarchos","year":"2008","unstructured":"Exarchos TP, Tsipouras MG, Papaloukas C, Fotiadis DI (2008) A two-stage methodology for sequence classification based on sequential pattern mining and optimization. Data & Knowl Eng 66(3):467\u2013487","journal-title":"Data & Knowl Eng"},{"key":"1113_CR13","doi-asserted-by":"publisher","first-page":"240","DOI":"10.1007\/978-3-030-46150-8_15","volume-title":"Machine learning and knowledge discovery in databases","author":"L Feremans","year":"2020","unstructured":"Feremans L, Vercruyssen V, Cule B, Meert W, Goethals B (2020) Pattern-based anomaly detection in mixed-type time series. In: Brefeld U, Fromont E, Hotho A, Knobbe A, Maathuis M, Robardet C (eds) Machine learning and knowledge discovery in databases. Springer, Cham, pp 240\u2013256"},{"key":"1113_CR14","doi-asserted-by":"crossref","unstructured":"Fischer J, Vreeken J (2021) Differentiable pattern set mining. In: Proceedings of the 27th ACM SIGKDD conference on knowledge discovery & data mining, pp 383\u2013392","DOI":"10.1145\/3447548.3467348"},{"key":"1113_CR15","doi-asserted-by":"publisher","DOI":"10.3389\/frai.2022.868085","volume":"5","author":"S Ghosh","year":"2022","unstructured":"Ghosh S, Yadav S, Wang X, Chakrabarty B, Kadio\u011flu S (2022) Dichotomic pattern mining integrated with constraint reasoning for digital behavior analysis. Front Artif Intell 5:868085","journal-title":"Front Artif Intell"},{"key":"1113_CR16","unstructured":"Gong Y, Liu L, Yang M, Bourdev L (2014) Compressing deep convolutional networks using vector quantization. arXiv preprint arXiv:1412.6115"},{"key":"1113_CR17","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s40854-020-00205-1","volume":"6","author":"A Gupta","year":"2020","unstructured":"Gupta A, Dengre V, Kheruwala HA, Shah M (2020) Comprehensive review of text-mining applications in finance. Financ Innov 6:1\u201325","journal-title":"Financ Innov"},{"key":"1113_CR18","doi-asserted-by":"publisher","first-page":"54","DOI":"10.1016\/j.eswa.2018.12.046","volume":"122","author":"Z He","year":"2019","unstructured":"He Z, Zhang S, Wu J (2019) Significance-based discriminative sequential pattern mining. Expert Syst Appl 122:54\u201364","journal-title":"Expert Syst Appl"},{"issue":"1","key":"1113_CR19","first-page":"251","volume":"35","author":"Z He","year":"2023","unstructured":"He Z, Wu Z, Xu G, Liu Y, Zou Q (2023) Decision tree for sequences. IEEE Trans Knowl Data Eng 35(1):251\u2013263","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"1113_CR20","doi-asserted-by":"crossref","unstructured":"Ifrim G, Bakir G, Weikum G (2008) Fast logistic regression for text categorization with variable-length n-grams. In: Proceedings of the 14th ACM SIGKDD international conference on knowledge discovery and data mining, pp 354\u2013362","DOI":"10.1145\/1401890.1401936"},{"key":"1113_CR21","doi-asserted-by":"crossref","unstructured":"Ifrim G, Wiuf C (2011) Bounded coordinate-descent for biological sequence classification in high dimensional predictor space. In: Proceedings of the 17th ACM SIGKDD international conference on knowledge discovery and data mining, pp 708\u2013716","DOI":"10.1145\/2020408.2020519"},{"key":"1113_CR22","doi-asserted-by":"publisher","first-page":"17233","DOI":"10.1007\/s00500-020-05015-2","volume":"24","author":"A Jamshed","year":"2020","unstructured":"Jamshed A, Mallick B, Kumar P (2020) Deep learning-based sequential pattern mining for progressive database. Soft Comput 24:17233\u201317246","journal-title":"Soft Comput"},{"issue":"3","key":"1113_CR23","doi-asserted-by":"publisher","first-page":"259","DOI":"10.1007\/s10115-006-0038-2","volume":"11","author":"X Ji","year":"2007","unstructured":"Ji X, Bailey J, Dong G (2007) Mining minimal distinguishing subsequence patterns with gap constraints. Knowl Inf Syst 11(3):259\u2013286","journal-title":"Knowl Inf Syst"},{"key":"1113_CR24","unstructured":"Jiang L, Bosch N (2021) Predictive sequential pattern mining via interpretable convolutional neural networks. In: Proceedings of the 14th international conference on educational data mining, International Educational Data Mining Society"},{"issue":"3","key":"1113_CR25","doi-asserted-by":"publisher","first-page":"553","DOI":"10.1016\/j.bbrc.2020.09.010","volume":"533","author":"K Kuzmin","year":"2020","unstructured":"Kuzmin K, Adeniyi AE, DaSouza AK, Lim D, Nguyen H, Molina NR, Xiong L, Weber IT, Harrison RW (2020) Machine learning methods accurately predict host specificity of coronaviruses based on spike sequences alone. Biochem Biophys Res Commun 533(3):553\u2013558","journal-title":"Biochem Biophys Res Commun"},{"issue":"1","key":"1113_CR26","doi-asserted-by":"publisher","first-page":"34","DOI":"10.1002\/sam.11192","volume":"7","author":"HT Lam","year":"2014","unstructured":"Lam HT, M\u00f6rchen F, Fradkin D, Calders T (2014) Mining compressing sequential patterns. Stat Anal Data Min: ASA Data Sci J 7(1):34\u201352","journal-title":"Stat Anal Data Min: ASA Data Sci J"},{"key":"1113_CR27","doi-asserted-by":"crossref","unstructured":"Lee J, Kim D, Ham B (2021)Network quantization with element-wise gradient scaling. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 6448\u20136457","DOI":"10.1109\/CVPR46437.2021.00638"},{"key":"1113_CR28","doi-asserted-by":"crossref","unstructured":"Lesh N, Zaki MJ, Ogihara M (1999) Mining features for sequence classification. In: Proceedings of the 5th ACM SIGKDD international conference on knowledge discovery and data mining, pp 342\u2013346","DOI":"10.1145\/312129.312275"},{"key":"1113_CR29","unstructured":"Liu H, Setiono R (1995) Chi2: Feature selection and discretization of numeric attributes. In: Proceedings of 7th IEEE international conference on tools with artificial intelligence, IEEE, pp 388\u2013391"},{"key":"1113_CR30","doi-asserted-by":"crossref","unstructured":"Lo D, Cheng H, Han J, Khoo S-C, Sun C (2009) Classification of software behaviors for failure detection: a discriminative pattern mining approach. In: Proceedings of the 15th ACM SIGKDD international conference on knowledge discovery and data mining, pp 557\u2013566","DOI":"10.1145\/1557019.1557083"},{"key":"1113_CR31","first-page":"419","volume":"2","author":"H Lodhi","year":"2002","unstructured":"Lodhi H, Saunders C, Shawe-Taylor J, Cristianini N, Watkins C (2002) Text classification using string kernels. J Mach Learn Res 2:419\u2013444","journal-title":"J Mach Learn Res"},{"key":"1113_CR32","doi-asserted-by":"crossref","unstructured":"Maggi FM, Bose RJC, Aalst WM (2012) Efficient discovery of understandable declarative process models from event logs. In: Proceedings of 24th international conference on advanced information systems engineering, Springer, pp 270\u2013285","DOI":"10.1007\/978-3-642-31095-9_18"},{"key":"1113_CR33","doi-asserted-by":"crossref","unstructured":"Maggi FM, Montali M, Di\u00a0Ciccio C, Mendling J (2016) Semantical vacuity detection in declarative process mining. In: Proceedings of the 14th international conference on business process management, Springer, pp 158\u2013175","DOI":"10.1007\/978-3-319-45348-4_10"},{"key":"1113_CR34","unstructured":"Nagel M, Fournarakis M, Bondarenko Y, Blankevoort T (2022) Overcoming oscillations in quantization-aware training. In: International conference on machine learning, PMLR, pp 16318\u201316330"},{"key":"1113_CR35","doi-asserted-by":"crossref","unstructured":"Nguyen D, Luo W, Nguyen TD, Venkatesh S, Phung D (2018) Sqn2vec: learning sequence representation via sequential patterns with a gap constraint. In: Joint European conference on machine learning and knowledge discovery in databases, Springer, pp 569\u2013584","DOI":"10.1007\/978-3-030-10928-8_34"},{"key":"1113_CR36","doi-asserted-by":"crossref","unstructured":"Nowak J, Korytkowski M, Scherer R (2020) Discovering sequential patterns by neural networks. In: 2020 international joint conference on neural networks (IJCNN), IEEE, pp 1\u20136","DOI":"10.1109\/IJCNN48605.2020.9207461"},{"key":"1113_CR37","doi-asserted-by":"crossref","unstructured":"Ntagiou AN, Tsipouras MG, Giannakeas N, Tzallas AT (2017) Protein structure recognition by means of sequential pattern mining. In: Proceedings of the 17th international conference on bioinformatics and bioengineering (BIBE), IEEE, pp 334\u2013339","DOI":"10.1109\/BIBE.2017.00-32"},{"key":"1113_CR38","doi-asserted-by":"crossref","unstructured":"Okanohara D, Tsujii J (2009) Text categorization with all substring features. In: Proceedings of the 2009 SIAM international conference on data mining, SIAM, pp 838\u2013846","DOI":"10.1137\/1.9781611972795.72"},{"key":"1113_CR39","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa F, Varoquaux G, Gramfort A, Michel V, Thirion B, Grisel O, Blondel M, Prettenhofer P, Weiss R, Dubourg V, Vanderplas J, Passos A, Cournapeau D, Brucher M, Perrot M, Duchesnay E (2011) Scikit-learn: machine learning in Python. J Mach Learn Res 12:2825\u20132830","journal-title":"J Mach Learn Res"},{"issue":"2","key":"1113_CR40","doi-asserted-by":"publisher","first-page":"133","DOI":"10.1007\/s10844-006-0006-z","volume":"28","author":"J Pei","year":"2007","unstructured":"Pei J, Han J, Wang W (2007) Constraint-based sequential pattern mining: the pattern-growth methods. J Intel Inf Syst 28(2):133\u2013160","journal-title":"J Intel Inf Syst"},{"key":"1113_CR41","doi-asserted-by":"crossref","unstructured":"Qiao L, Wang W, Lin B (2021) Learning accurate and interpretable decision rule sets from neural networks. In: Proceedings of the AAAI conference on artificial intelligence, vol 35. pp 4303\u20134311","DOI":"10.1609\/aaai.v35i5.16555"},{"issue":"2","key":"1113_CR42","doi-asserted-by":"publisher","first-page":"668","DOI":"10.1007\/s10618-021-00813-0","volume":"36","author":"C Ranjan","year":"2022","unstructured":"Ranjan C, Ebrahimi S, Paynabar K (2022) Sequence graph transform (SGT): a feature embedding function for sequence data mining. Data Min Knowl Disc 36(2):668\u2013708","journal-title":"Data Min Knowl Disc"},{"key":"1113_CR43","doi-asserted-by":"crossref","unstructured":"Rastegari M, Ordonez V, Redmon J, Farhadi A (2016) Xnor-net: imagenet classification using binary convolutional neural networks. In: Proceedings of the 2016 European conference on computer vision, Springer pp 525\u2013542","DOI":"10.1007\/978-3-319-46493-0_32"},{"key":"1113_CR44","doi-asserted-by":"crossref","unstructured":"Shvo M, Li AC, Icarte RT, McIlraith SA (2021) Interpretable sequence classification via discrete optimization. In: Proceedings of the AAAI conference on artificial intelligence, vol 35. pp 9647\u20139656","DOI":"10.1609\/aaai.v35i11.17161"},{"key":"1113_CR45","unstructured":"Singh N (2024) Demystify DNA Sequencing with Machine Learning. Kaggle. https:\/\/www.kaggle.com\/code\/nageshsingh\/demystify-dna-sequencing-with-machine-learning\/notebook"},{"key":"1113_CR46","doi-asserted-by":"crossref","unstructured":"Srikant R, Agrawal R (1996) Mining sequential patterns: generalizations and performance improvements. In: Proceedings of the advances in database technology\u2013EDBT\u201996: 5th international conference on extending database technology, Springer, pp 1\u201317","DOI":"10.1007\/BFb0014140"},{"key":"1113_CR47","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1016\/j.asoc.2014.10.029","volume":"27","author":"C-Y Tsai","year":"2015","unstructured":"Tsai C-Y, Chen C-J (2015) A PSO-AB classifier for solving sequence classification problems. Appl Soft Comput 27:11\u201327","journal-title":"Appl Soft Comput"},{"key":"1113_CR48","doi-asserted-by":"crossref","unstructured":"Tu Z, Chen X, Ren P, Wang Y (2022) AdaBin: improving binary neural networks with adaptive binary sets. In: European conference on computer vision, Springer, pp 379\u2013395","DOI":"10.1007\/978-3-031-20083-0_23"},{"key":"1113_CR49","doi-asserted-by":"crossref","unstructured":"Wang Z, Zhang W, Ning L, Wang J (2020) Transparent classification with multilayer logical perceptrons and random binarization. In: Proceedings of the AAAI conference on artificial intelligence, vol 34. pp 6331\u20136339","DOI":"10.1609\/aaai.v34i04.6102"},{"key":"1113_CR50","first-page":"30479","volume":"34","author":"Z Wang","year":"2021","unstructured":"Wang Z, Zhang W, Liu N, Wang J (2021) Scalable rule-based representation learning for interpretable classification. Adv Neural Inf Process Syst 34:30479\u201330491","journal-title":"Adv Neural Inf Process Syst"},{"key":"1113_CR51","volume":"10","author":"W Wang","year":"2022","unstructured":"Wang W, Qiao L, Lin B (2022) Tabular machine learning using conjunctive threshold neural networks. Mach Learn Appl 10:100429","journal-title":"Mach Learn Appl"},{"key":"1113_CR52","doi-asserted-by":"crossref","unstructured":"Wu J, Leng C, Wang Y, Hu Q, Cheng J (2016) Quantized convolutional neural networks for mobile devices. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 4820\u20134828","DOI":"10.1109\/CVPR.2016.521"},{"issue":"1","key":"1113_CR53","doi-asserted-by":"publisher","first-page":"40","DOI":"10.1145\/1882471.1882478","volume":"12","author":"Z Xing","year":"2010","unstructured":"Xing Z, Pei J, Keogh E (2010) A brief survey on sequence classification. SIGKDD Explor Newsl 12(1):40\u201348","journal-title":"SIGKDD Explor Newsl"},{"issue":"1","key":"1113_CR54","doi-asserted-by":"publisher","first-page":"7238","DOI":"10.1038\/s41467-022-34904-3","volume":"13","author":"W-F Zeng","year":"2022","unstructured":"Zeng W-F, Zhou X-X, Willems S, Ammar C, Wahle M, Bludau I, Voytik E, Strauss MT, Mann M (2022) AlphaPeptDeep: a modular deep learning framework to predict peptide properties for proteomics. Nat Commun 13(1):7238","journal-title":"Nat Commun"},{"key":"1113_CR55","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.knosys.2015.06.014","volume":"89","author":"J Zhang","year":"2015","unstructured":"Zhang J, Wang Y, Yang D (2015) CCSpan: mining closed contiguous sequential patterns. Knowl-Based Syst 89:1\u201313","journal-title":"Knowl-Based Syst"},{"issue":"5","key":"1113_CR56","doi-asserted-by":"publisher","first-page":"1285","DOI":"10.1109\/TKDE.2015.2510010","volume":"28","author":"C Zhou","year":"2016","unstructured":"Zhou C, Cule B, Goethals B (2016) Pattern based sequence classification. IEEE Trans Knowl Data Eng 28(5):1285\u20131298","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"1113_CR57","unstructured":"Zhou S, Wu Y, Ni Z, Zhou X, Wen H, Zou Y (2016) Dorefa-net: training low bitwidth convolutional neural networks with low bitwidth gradients. arXiv preprint arXiv:1606.06160"}],"container-title":["Data Mining and Knowledge Discovery"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10618-025-01113-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10618-025-01113-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10618-025-01113-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,6]],"date-time":"2025-09-06T19:06:51Z","timestamp":1757185611000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10618-025-01113-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6,10]]},"references-count":57,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2025,7]]}},"alternative-id":["1113"],"URL":"https:\/\/doi.org\/10.1007\/s10618-025-01113-7","relation":{},"ISSN":["1384-5810","1573-756X"],"issn-type":[{"type":"print","value":"1384-5810"},{"type":"electronic","value":"1573-756X"}],"subject":[],"published":{"date-parts":[[2025,6,10]]},"assertion":[{"value":"21 October 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"22 May 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"10 June 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"40"}}