{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,5,24]],"date-time":"2024-05-24T19:00:09Z","timestamp":1716577209368},"reference-count":59,"publisher":"Springer Science and Business Media LLC","issue":"6","license":[{"start":{"date-parts":[[2014,11,4]],"date-time":"2014-11-04T00:00:00Z","timestamp":1415059200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Data Min Knowl Disc"],"published-print":{"date-parts":[[2015,11]]},"DOI":"10.1007\/s10618-014-0391-9","type":"journal-article","created":{"date-parts":[[2014,11,3]],"date-time":"2014-11-03T07:47:43Z","timestamp":1415000863000},"page":"1685-1708","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":12,"title":["Learning sequential classifiers from long and noisy discrete-event sequences efficiently"],"prefix":"10.1007","volume":"29","author":[{"given":"Gess\u00e9","family":"Daf\u00e9","sequence":"first","affiliation":[]},{"given":"Adriano","family":"Veloso","sequence":"additional","affiliation":[]},{"given":"Mohammed","family":"Zaki","sequence":"additional","affiliation":[]},{"suffix":"Jr.","given":"Wagner","family":"Meira","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2014,11,4]]},"reference":[{"key":"391_CR1","doi-asserted-by":"crossref","unstructured":"Agrawal R, Srikant R (1995) Mining sequential patterns. In: ICDE, pp 3\u201314","DOI":"10.1109\/ICDE.1995.380415"},{"key":"391_CR2","unstructured":"Bannister W (2007) Associative and sequential classification with adaptive constrained regression methods. PhD thesis, Tempe, AZ, USA"},{"issue":"6","key":"391_CR3","doi-asserted-by":"publisher","first-page":"1554","DOI":"10.1214\/aoms\/1177699147","volume":"37","author":"L Baum","year":"1966","unstructured":"Baum L, Petrie T (1966) Statistical inference for probabilistic functions of finite state Markov chains. Ann Math Stat 37(6):1554\u20131563","journal-title":"Ann Math Stat"},{"key":"391_CR4","doi-asserted-by":"publisher","first-page":"164","DOI":"10.1214\/aoms\/1177697196","volume":"41","author":"L Baum","year":"1970","unstructured":"Baum L, Petrie T, Soules G, Weiss N (1970) A maximization technique occurring in the statistical analysis of probabilistic functions of Markov chains. Ann Math Stat 41:164","journal-title":"Ann Math Stat"},{"issue":"9\u201310","key":"391_CR5","doi-asserted-by":"publisher","first-page":"1395","DOI":"10.1016\/S0167-8655(02)00380-X","volume":"24","author":"M Bicego","year":"2003","unstructured":"Bicego M, Murino V, Figueiredo M (2003a) A sequential pruning strategy for the selection of the number of states in hidden Markov models. Pattern Recognit Lett 24(9\u201310):1395\u20131407","journal-title":"Pattern Recognit Lett"},{"issue":"12","key":"391_CR6","doi-asserted-by":"publisher","first-page":"2281","DOI":"10.1016\/S0031-3203(04)00162-1","volume":"37","author":"M Bicego","year":"2004","unstructured":"Bicego M, Murino V, Figueiredo M (2004) Similarity-based classification of sequences using hidden Markov models. Pattern Recognit 37(12):2281\u20132291","journal-title":"Pattern Recognit"},{"issue":"10","key":"391_CR7","doi-asserted-by":"publisher","first-page":"1813","DOI":"10.1016\/j.patcog.2006.04.004","volume":"39","author":"M Bicego","year":"2006","unstructured":"Bicego M, Murino V, Pelillo M, Torsello A (2006) Similarity-based pattern recognition. Pattern Recognit 39(10):1813\u20131814","journal-title":"Pattern Recognit"},{"issue":"2","key":"391_CR8","doi-asserted-by":"publisher","first-page":"480","DOI":"10.1214\/aos\/1018031204","volume":"27","author":"P B\u00fchlmann","year":"1999","unstructured":"B\u00fchlmann P, Wyner A (1999) Variable length Markov chains. Ann Stat 27(2):480\u2013513","journal-title":"Ann Stat"},{"key":"391_CR9","doi-asserted-by":"crossref","unstructured":"Chang CC, Lin CJ (2011) LIBSVM: a library for support vector machines. ACM Trans Intell Syst Technol 2:27:1\u201327:27, software available at http:\/\/www.csie.ntu.edu.tw\/cjlin\/libsvm","DOI":"10.1145\/1961189.1961199"},{"key":"391_CR10","unstructured":"Davis A, Veloso A, da Silva A, Laender A, Meira W Jr (2012) Named entity disambiguation in streaming data. In: ACL, pp 815\u2013824"},{"issue":"2","key":"391_CR11","doi-asserted-by":"publisher","first-page":"163","DOI":"10.1145\/990301.990304","volume":"4","author":"M Deshpande","year":"2004","unstructured":"Deshpande M, Karypis G (2004) Selective Markov models for predicting web page accesses. ACM Trans Internet Technol 4(2):163\u2013184","journal-title":"ACM Trans Internet Technol"},{"key":"391_CR12","doi-asserted-by":"crossref","unstructured":"Durbin R, Eddy AKS, Mitchison G (1998) Biological sequence analysis. Cambridge University Press","DOI":"10.1017\/CBO9780511790492"},{"key":"391_CR13","doi-asserted-by":"crossref","unstructured":"Durbin R, Eddy S, Krogh A, Mitchison G (1998) Biological sequence analysis: probabilistic models of proteins and nucleic acids. Cambridge University Press","DOI":"10.1017\/CBO9780511790492"},{"issue":"1","key":"391_CR14","doi-asserted-by":"publisher","first-page":"23","DOI":"10.1006\/csla.1997.0037","volume":"12","author":"J Preez Du","year":"1998","unstructured":"Du Preez J (1998) Efficient training of high-order hidden Markov models using first-order representations. Comput Speech Lang 12(1):23\u201339","journal-title":"Comput Speech Lang"},{"issue":"9","key":"391_CR15","doi-asserted-by":"publisher","first-page":"755","DOI":"10.1093\/bioinformatics\/14.9.755","volume":"14","author":"S Eddy","year":"1998","unstructured":"Eddy S (1998) Profile hidden Markov models. Bioinformatics 14(9):755\u2013763","journal-title":"Bioinformatics"},{"key":"391_CR16","unstructured":"Galassi U, Giordana A, Saitta L (2007) Incremental construction of structured hidden Markov models. In: IJCAI, pp 798\u2013803"},{"key":"391_CR17","unstructured":"Golding A, Roth D (1996) Applying winnow to context-sensitive spelling correction. CoRR"},{"key":"391_CR18","doi-asserted-by":"crossref","unstructured":"Han H, Giles C, Zha H, Li C, Tsioutsiouliklis K (2004) Two supervised learning approaches for name disambiguation in author citations. In: JCDL, pp 296\u2013305","DOI":"10.1145\/996350.996419"},{"key":"391_CR19","doi-asserted-by":"crossref","unstructured":"Han H, Zha H, Giles C (2005) Name disambiguation in author citations using a k-way spectral clustering method. In: JCDL, pp 334\u2013343","DOI":"10.1145\/1065385.1065462"},{"key":"391_CR20","unstructured":"Haussler D (1999) Convolution kernels on discrete structures. Tech. rep,Technical report, UC Santa Cruz"},{"issue":"10","key":"391_CR21","doi-asserted-by":"publisher","first-page":"1039","DOI":"10.1109\/34.541414","volume":"18","author":"J Hu","year":"1996","unstructured":"Hu J, Brown M, Turin W (1996) Hmm based on-line handwriting recognition. IEEE Trans Pattern Anal Mach Intell 18(10):1039\u20131045","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"2","key":"391_CR22","first-page":"95","volume":"12","author":"R Hughey","year":"1996","unstructured":"Hughey R, Krogh A (1996) Hidden Markov models for sequence analysis: extension and analysis of the basic method. Comput Appl Biosci 12(2):95\u2013107","journal-title":"Comput Appl Biosci"},{"key":"391_CR23","doi-asserted-by":"crossref","unstructured":"Kriouile A, Mari J, Haon J (1990) Some improvements in speech recognition algorithms based on HMM. In: ICASSP, pp 545\u2013548","DOI":"10.1109\/ICASSP.1990.115770"},{"key":"391_CR24","unstructured":"Kuksa P, Huang PH, Pavlovic V (2008) A fast, large-scale learning method for protein sequence classification. In: 8th international workshop on data mining in bioinformatics, pp 29\u201337"},{"issue":"3","key":"391_CR25","doi-asserted-by":"publisher","first-page":"295","DOI":"10.1145\/322510.322526","volume":"2","author":"T Lane","year":"1999","unstructured":"Lane T, Brodley C (1999) Temporal sequence learning and data reduction for anomaly detection. ACM Trans Inf Syst Secur 2(3):295\u2013331","journal-title":"ACM Trans Inf Syst Secur"},{"key":"391_CR26","doi-asserted-by":"crossref","unstructured":"Law H, Chan C (1996) N-th order ergodic multigram hmm for modeling of languages without marked word boundaries. In: COLING, pp 204\u2013209","DOI":"10.3115\/992628.992666"},{"key":"391_CR27","doi-asserted-by":"crossref","unstructured":"Lesh N, Zaki M, Ogihara M (1999) Mining features for sequence classification. In: KDD, pp 342\u2013346","DOI":"10.1145\/312129.312275"},{"key":"391_CR28","doi-asserted-by":"crossref","unstructured":"Leslie C, Kuang R (2003) Fast kernels for inexact string matching. In: COLT, pp 114\u2013128","DOI":"10.1007\/978-3-540-45167-9_10"},{"key":"391_CR29","first-page":"1435","volume":"5","author":"C Leslie","year":"2004","unstructured":"Leslie C, Kuang R (2004) Fast string kernels using inexact matching for protein sequences. J Mach Learn Res 5:1435\u20131455","journal-title":"J Mach Learn Res"},{"key":"391_CR30","first-page":"566","volume":"7","author":"C Leslie","year":"2002","unstructured":"Leslie C, Eskin E, Noble WS (2002a) The spectrum kernel: a string kernel for SVM protein classification. Pac Symp Biocomput 7:566\u2013575","journal-title":"Pac Symp Biocomput"},{"key":"391_CR31","unstructured":"Leslie C, Eskin E, Weston J, Noble W (2002b) Mismatch string kernels for SVM protein classification. In: NIPS, pp 1417\u20131424"},{"issue":"4","key":"391_CR32","doi-asserted-by":"publisher","first-page":"467","DOI":"10.1093\/bioinformatics\/btg431","volume":"20","author":"C Leslie","year":"2004","unstructured":"Leslie C, Eskin E, Cohen A, Weston J, Noble W (2004) Mismatch string kernels for discriminative protein classification. Bioinformatics 20(4):467\u2013476","journal-title":"Bioinformatics"},{"key":"391_CR33","doi-asserted-by":"crossref","unstructured":"Lin M, Hsueh S, Chen M, Hsu H (2009) Mining sequential patterns for image classification in ubiquitous multimedia systems. In: IIH-MSP, pp 303\u2013306","DOI":"10.1109\/IIH-MSP.2009.261"},{"key":"391_CR34","first-page":"419","volume":"2","author":"H Lodhi","year":"2002","unstructured":"Lodhi H, Saunders C, Shawe-Taylor J, Cristianini N, Watkins C (2002) Text classification using string kernels. J Mach Learn Res 2:419\u2013444","journal-title":"J Mach Learn Res"},{"issue":"2","key":"391_CR35","doi-asserted-by":"publisher","first-page":"117","DOI":"10.1145\/1809400.1809424","volume":"11","author":"H Lodhi","year":"2009","unstructured":"Lodhi H, Muggleton S, Sternberg M (2009) Multi-class protein fold recognition using large margin logic based divide and conquer learning. SIGKDD Explor 11(2):117\u2013122","journal-title":"SIGKDD Explor"},{"key":"391_CR36","doi-asserted-by":"crossref","unstructured":"Malik H, Kender J (2008) Classifying high-dimensional text and web data using very short patterns. In: ICDM, pp 923\u2013928","DOI":"10.1109\/ICDM.2008.139"},{"key":"391_CR37","doi-asserted-by":"crossref","unstructured":"M\u00fcller S, Eickeler S, Rigoll G (2000) Crane gesture recognition using pseudo 3-d hidden Markov models. In: FG (Conf. on Automatic Face and Gesture Recognition), pp 398\u2013402","DOI":"10.1109\/AFGR.2000.840665"},{"issue":"4","key":"391_CR38","first-page":"536","volume":"247","author":"A Murzin","year":"1995","unstructured":"Murzin A, Brenner S, Hubbard T, Chothia C (1995) SCOP: a structural classification of proteins database for the investigation of sequences and structures. J Mol Biol 247(4):536\u2013540","journal-title":"J Mol Biol"},{"key":"391_CR39","unstructured":"Pitkow J, Pirolli P (1999) Mining longest repeating subsequences to predict world wide web surfing. In: USENIX symposium on Internet technologies and systems"},{"issue":"2","key":"391_CR40","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1109\/5.18626","volume":"77","author":"L Rabiner","year":"1989","unstructured":"Rabiner L (1989) A tutorial on hidden Markov models and selected applications in speech recognition. Proc IEEE 77(2):257\u2013286","journal-title":"Proc IEEE"},{"key":"391_CR41","first-page":"23","volume":"9","author":"K Rieck","year":"2008","unstructured":"Rieck K, Laskov P (2008) Linear-time computation of similarity measures for sequential data. J Mach Learn Res 9:23\u201348","journal-title":"J Mach Learn Res"},{"issue":"1","key":"391_CR42","first-page":"1323","volume":"6","author":"J Rousu","year":"2005","unstructured":"Rousu J, Shawe-Taylor J (2005) Efficient computation of gapped substring kernels on large alphabets. J Mach Learn Res 6(1):1323\u20131344","journal-title":"J Mach Learn Res"},{"issue":"1","key":"391_CR43","doi-asserted-by":"publisher","first-page":"75","DOI":"10.1023\/A:1007649326333","volume":"37","author":"L Saul","year":"1999","unstructured":"Saul L, Jordan M (1999) Mixed memory Markov models: decomposing complex stochastic processes as mixtures of simpler ones. Mach Learn 37(1):75\u201387","journal-title":"Mach Learn"},{"key":"391_CR44","doi-asserted-by":"crossref","unstructured":"Schwardt L, Preez JD (2000) Efficient mixed-order hidden Markov model inference. In: ICSLP, pp 238\u2013241","DOI":"10.21437\/ICSLP.2000-253"},{"key":"391_CR45","unstructured":"Sha F, Saul L (2006) Large margin hidden Markov models for automatic speech recognition. In: NIPS, pp 1249\u20131256"},{"key":"391_CR46","doi-asserted-by":"crossref","unstructured":"Silva I, Gomide J, Veloso A, Meira Jr W, Ferreira R (2011) Effective sentiment stream analysis with self-augmenting training and demand-driven projection. In: SIGIR, pp 475\u2013484","DOI":"10.1145\/2009916.2009981"},{"key":"391_CR47","doi-asserted-by":"crossref","unstructured":"Srikant R, Agrawal R (1996) Mining sequential patterns: generalizations and performance improvements. In: EDBT, pp 3\u201317","DOI":"10.1007\/BFb0014140"},{"key":"391_CR48","first-page":"1505","volume":"17","author":"L Srivatsan","year":"2005","unstructured":"Srivatsan L, Sastry P, Unnikrishnan K (2005) Discovering frequent episodes and learning hidden Markov models: a formal connection. IEEE TKDE 17:1505\u20131517","journal-title":"IEEE TKDE"},{"key":"391_CR49","first-page":"1913","volume":"10","author":"Z Syed","year":"2009","unstructured":"Syed Z, Indyk P, Guttag J (2009) Learning approximate sequential patterns for classification. J Mach Learn Res 10:1913\u20131936","journal-title":"J Mach Learn Res"},{"key":"391_CR50","doi-asserted-by":"crossref","unstructured":"Szymanski B (2004) Recursive data mining for masquerade detection and author identification. Workshop on Information Assurance, pp 424\u2013431","DOI":"10.1109\/IAW.2004.1437848"},{"key":"391_CR51","doi-asserted-by":"crossref","unstructured":"Tseng V, Lee C (2005) CBS: a new classification method by using sequential patterns. In: SDM","DOI":"10.1137\/1.9781611972757.68"},{"key":"391_CR52","unstructured":"Vapnik V (1979) Estimation of dependences based on empirical data (in Russian). Nauka"},{"key":"391_CR53","doi-asserted-by":"crossref","unstructured":"Veloso A, Meira W Jr (2011) Demand-driven associative classification. Springer","DOI":"10.1007\/978-0-85729-525-5"},{"key":"391_CR54","doi-asserted-by":"crossref","unstructured":"Wang Y, Zhou L, Feng J, Wang J, Liu Z (2006) Mining complex time-series data by learning Markovian models. In: ICDM, pp 1136\u20131140","DOI":"10.1109\/ICDM.2006.105"},{"key":"391_CR55","unstructured":"Watkins C (1999) Dynamic alignment kernels. Advances in neural information processing systems, pp 39\u201350"},{"key":"391_CR56","doi-asserted-by":"crossref","unstructured":"Ye L, Keogh E (2009) Time series shapelets: a new primitive for data mining. In: KDD, pp 947\u2013956","DOI":"10.1145\/1557019.1557122"},{"issue":"1\u20132","key":"391_CR57","doi-asserted-by":"publisher","first-page":"149","DOI":"10.1007\/s10618-010-0179-5","volume":"22","author":"L Ye","year":"2011","unstructured":"Ye L, Keogh E (2011) Time series shapelets: a novel technique that allows accurate, interpretable and fast classification. Data Min Knowl Discov 22(1\u20132):149\u2013182","journal-title":"Data Min Knowl Discov"},{"key":"391_CR58","doi-asserted-by":"crossref","unstructured":"Zaki M (2000) Sequence mining in categorical domains: Incorporating constraints. In: CIKM, pp 422\u2013429","DOI":"10.1145\/354756.354849"},{"key":"391_CR59","doi-asserted-by":"crossref","unstructured":"Zaki M, Carothers C, Szymanski B (2010) Vogue: a variable order hidden Markov model with duration based on frequent sequence mining. TKDD 4(1):1\u201331","DOI":"10.1145\/1644873.1644878"}],"container-title":["Data Mining and Knowledge Discovery"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10618-014-0391-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10618-014-0391-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10618-014-0391-9","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10618-014-0391-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,7,17]],"date-time":"2023-07-17T19:58:48Z","timestamp":1689623928000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10618-014-0391-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014,11,4]]},"references-count":59,"journal-issue":{"issue":"6","published-print":{"date-parts":[[2015,11]]}},"alternative-id":["391"],"URL":"https:\/\/doi.org\/10.1007\/s10618-014-0391-9","relation":{},"ISSN":["1384-5810","1573-756X"],"issn-type":[{"value":"1384-5810","type":"print"},{"value":"1573-756X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2014,11,4]]},"assertion":[{"value":"2 March 2014","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 October 2014","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 November 2014","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}