{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,26]],"date-time":"2025-06-26T04:06:45Z","timestamp":1750910805866,"version":"3.41.0"},"reference-count":41,"publisher":"Springer Science and Business Media LLC","issue":"S5","license":[{"start":{"date-parts":[[2017,9,4]],"date-time":"2017-09-04T00:00:00Z","timestamp":1504483200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Cluster Comput"],"published-print":{"date-parts":[[2019,9]]},"DOI":"10.1007\/s10586-017-1137-4","type":"journal-article","created":{"date-parts":[[2017,9,4]],"date-time":"2017-09-04T06:54:18Z","timestamp":1504508058000},"page":"10605-10614","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["A hybrid approach for mismatch data reduction in datasets and guide data mining"],"prefix":"10.1007","volume":"22","author":[{"given":"R.","family":"Dhanalakshmi","sequence":"first","affiliation":[]},{"given":"T.","family":"Sethukarasi","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,9,4]]},"reference":[{"key":"1137_CR1","unstructured":"Han, J., Kamber, M.: Data Mining\u2014Concepts & Techniques. Morgan Kaufmann Publishers, Academic Press (2001)"},{"key":"1137_CR2","unstructured":"Sankar\u00a0Rajagopal, D.R.: Customer data clustering using data mining technique. Int. J. Database Manag. Syst. 3(4) (2011)"},{"issue":"1","key":"1137_CR3","doi-asserted-by":"publisher","first-page":"25","DOI":"10.7763\/IJCCE.2013.V2.128","volume":"2","author":"J Yabing","year":"2013","unstructured":"Yabing, J.: Research of an improved apriori algorithm in data mining association rule. Int. J. Comput. Commun. Eng. 2(1), 25 (2013)","journal-title":"Int. J. Comput. Commun. Eng."},{"key":"1137_CR4","unstructured":"Fournier-Viger, P., Lin, J.C.W., Kiran, R.U., Koh, Y.S., Thomas, R.: A survey of sequential pattern mining. Data Sci. Pattern Recognit. Ubiquitous Int. 1(1) (2017)"},{"issue":"3","key":"1137_CR5","doi-asserted-by":"publisher","first-page":"1333","DOI":"10.1007\/s10586-016-0589-2","volume":"19","author":"L Lin","year":"2016","unstructured":"Lin, L., Ye, J., Deng, F., Xiong, S., Zhong, L.: A comparison study of clustering algorithms for microblog posts. Cluster Comput. 19(3), 1333\u20131345 (2016)","journal-title":"Cluster Comput."},{"issue":"4","key":"1137_CR6","doi-asserted-by":"publisher","first-page":"1723","DOI":"10.1007\/s10586-016-0643-0","volume":"19","author":"NK Kamila","year":"2016","unstructured":"Kamila, N.K., Jena, L., Bhuyan, H.K.: Pareto-based multi-objective optimization for classification in data mining. Cluster Comput. 19(4), 1723\u20131745 (2016)","journal-title":"Cluster Comput."},{"key":"1137_CR7","doi-asserted-by":"crossref","unstructured":"Wang, J., Su, X.: An improved K-means clustering algorithm. In: 2011 IEEE 3rd International Conference on Communication Software and Networks, Xi\u2019an, pp. 44\u201346 (2011)","DOI":"10.1109\/ICCSN.2011.6014384"},{"issue":"3","key":"1137_CR8","doi-asserted-by":"publisher","first-page":"291","DOI":"10.1023\/A:1009700419189","volume":"1","author":"T Fawcett","year":"1997","unstructured":"Fawcett, T., Provost, F.: Adaptive fraud detection. Data Min. Knowl. Discov. J. 1(3), 291\u2013316 (1997)","journal-title":"Data Min. Knowl. Discov. J."},{"key":"1137_CR9","unstructured":"DuMouchel, W., Schonlau, M.: A fast computer intrusion detection algorithm based on hypothesis testing of command transition probabilities. In: Proceedings of the 4th International Conference on Knowledge Discovery and Data Mining, pp. 189\u2013193 (1998)"},{"key":"1137_CR10","series-title":"Lecture Notes in Artificial Intelligence","first-page":"340","volume-title":"Mining the Knowledge Mine: The Hot Spots Methodology for Mining Large Real World Databases","author":"G Williams","year":"1997","unstructured":"Williams, G., Huang, Z.: Advanced topics in artificial intelligence. In: Sattar, A. (ed.) Mining the Knowledge Mine: The Hot Spots Methodology for Mining Large Real World Databases. Lecture Notes in Artificial Intelligence, vol. 1342, pp. 340\u2013348. Springer, Berlin (1997)"},{"key":"1137_CR11","doi-asserted-by":"crossref","unstructured":"Yamanishi, K., Takeuchi, J., Williams, G., Milne, P.: On-line unsupervised outlier detection using finite mixtures with discounting learning algorithm. In: Proceedings of KDD2000, pp. 320\u2013324 (2000)","DOI":"10.1145\/347090.347160"},{"key":"1137_CR12","doi-asserted-by":"crossref","unstructured":"Breunig, M., Kriegel, H., Ng, R., Sander, J.: Lof: identifying density-based local outliers. In: Proceedings of ACM SIGMOD, International Conference on Management of Data (2000)","DOI":"10.1145\/342009.335388"},{"key":"1137_CR13","doi-asserted-by":"crossref","unstructured":"Ramaswamy, S., Rastogi, R., Shim K.: Efficient algorithms for mining outliers from large data sets. In: Proceedings of International Conference on Management of Data, ACM-SIGMOD, Dallas (2000)","DOI":"10.1145\/342009.335437"},{"key":"1137_CR14","unstructured":"Knorr, E., Ng, R.: Algorithms for mining distance-based outliers in large datasets. In: Proceedings of 24rd International Conference on Very Large Data Bases (VLDB), pp. 392\u2013403 (1998)"},{"key":"1137_CR15","doi-asserted-by":"publisher","first-page":"1329","DOI":"10.1080\/01621459.1994.10476872","volume":"89","author":"AC Atkinson","year":"1994","unstructured":"Atkinson, A.C.: Fast very robust methods for the detection of multiple outliers. J. Am. Stat. Assoc. 89, 1329\u20131339 (1994)","journal-title":"J. Am. Stat. Assoc."},{"key":"1137_CR16","doi-asserted-by":"crossref","unstructured":"Kosinksi, A.S.: A procedure for the detection of multivariate outliers. Comput. Stat. Data Anal. 29 (1999)","DOI":"10.1016\/S0167-9473(98)00073-5"},{"key":"1137_CR17","unstructured":"Knorr, E., Ng, R.: A unified approach for mining outliers. In: Proceedings of KDD, pp. 219\u2013222 (1997)"},{"key":"1137_CR18","unstructured":"Knorr, E., Ng, R.: Algorithms for mining distance-based outliers in large datasets. In: Proceedings of 24th International Conference on Very Large Data Bases, VLDB, pp. 392\u2013 403, 24\u201327 (1998)"},{"issue":"5","key":"1137_CR19","doi-asserted-by":"publisher","first-page":"657","DOI":"10.1109\/TPAMI.2005.95","volume":"27","author":"JZ Huang","year":"2005","unstructured":"Huang, J.Z., et al.: Automated variable weighting in k-means type clustering. IEEE Trans. Pattern Anal. Mach. Intell. 27(5), 657\u2013668 (2005)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"5","key":"1137_CR20","doi-asserted-by":"publisher","first-page":"943","DOI":"10.1016\/j.patcog.2003.11.003","volume":"37","author":"EY Chan","year":"2004","unstructured":"Chan, E.Y., et al.: An optimization algorithm for clustering using weighted dissimilarity measures. Pattern Recognit. 37(5), 943\u2013952 (2004)","journal-title":"Pattern Recognit."},{"key":"1137_CR21","doi-asserted-by":"crossref","unstructured":"Huang, J.Z., et al.: Weighting method for feature selection in K-means. In: Computational Methods of Feature Selection , pp. 193\u2013210 (2008)","DOI":"10.1201\/9781584888796.ch10"},{"issue":"3","key":"1137_CR22","doi-asserted-by":"publisher","first-page":"1061","DOI":"10.1016\/j.patcog.2011.08.012","volume":"45","author":"RC Amorim de","year":"2012","unstructured":"de Amorim, R.C., Mirkin, B.: Minkowski metric, feature weighting and anomalous cluster initializing in K-means clustering. Pattern Recognit. 45(3), 1061\u20131075 (2012)","journal-title":"Pattern Recognit."},{"issue":"1","key":"1137_CR23","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1023\/A:1015608814486","volume":"12","author":"E Hung","year":"2002","unstructured":"Hung, E., Cheung, D.W.: Parallel mining of outliers in large database. Distrib. Parallel Databases 12(1), 5\u201326 (2002)","journal-title":"Distrib. Parallel Databases"},{"key":"1137_CR24","doi-asserted-by":"crossref","unstructured":"Lozano, E., Acuna, E.: Parallel algorithms for distance-based and density-based outliers. In: Proceedings of Fifth IEEE International Conference on Data Mining (ICDM), pp. 729\u2013732 (2005)","DOI":"10.1109\/ICDM.2005.116"},{"key":"1137_CR25","doi-asserted-by":"crossref","unstructured":"Bay, S.D., Schwabacher, M.: Mining distance-based outliers in near linear time with randomization and a simple pruning rule. In: Proceedings of Ninth ACM SIGKDD International Conference on Knowledge Discovery and Data Mining (KDD) (2003)","DOI":"10.1145\/956750.956758"},{"key":"1137_CR26","unstructured":"Ng, R., Han, J.: Efficient and effective clustering methods for spatial data mining. In: Proceedings of 20th VLDB, pp. 144\u2013155 (1994)"},{"key":"1137_CR27","unstructured":"Ester, M., Kriegel, H.P., Sander, J., Xu, X.: A density-based algorithm for discovering clusters in large spatial databases with noise. In: Proceedings of KDD, pp. 226\u2013231 (1999)"},{"key":"1137_CR28","doi-asserted-by":"crossref","unstructured":"Zhang, T., Ramakrishnan, R., Livny M.: An efficient data clustering method for very large databases. In: Proceedings of ACM SIGMOD, pp. 103\u2013114 (1996)","DOI":"10.1145\/235968.233324"},{"key":"1137_CR29","unstructured":"Kollios, G., Gunopoulos, D., Koudas, N., Berchtold, S.: An efficient approximation scheme for data mining tasks. In: ICDE (2001)"},{"issue":"4","key":"1137_CR30","first-page":"487","volume":"6","author":"A Bartkowiak","year":"1997","unstructured":"Bartkowiak, A., Szustalewicz, A.: Detecting multivariate outliers by a grand tour. Mach. Graph. Vis. 6(4), 487\u2013505 (1997)","journal-title":"Mach. Graph. Vis."},{"key":"1137_CR31","first-page":"24","volume-title":"The Integrated Delivery of Large-Scale Data Mining: The ACSys Data Mining Project","author":"G Williams","year":"2000","unstructured":"Williams, G., Altas, I., Bakin, S., Christen, P., Hegland, Markus, Marquez, Alonso, Milne, Peter, Nagappan, Rajehndra, Roberts, Stephen: Large-scale parallel data mining, LNAI state-of-the art survey. In: Zaki, M.J., Ho, C.-T. (eds.) The Integrated Delivery of Large-Scale Data Mining: The ACSys Data Mining Project, pp. 24\u201354. Springer, Berlin (2000)"},{"key":"1137_CR32","unstructured":"Swayne, D.F., Cook, D., Buja A.: XGobi: interactive dynamic graphics in the X window system with a link to S. In: Proceedings of the ASA Section on Statistical Graphics, pp. 1\u20138, Alexandria, VA. American Statistical Association (1991)"},{"key":"1137_CR33","unstructured":"Sykacek, P.: Equivalent error bars for neural network classifiers trained by Bayesian inference. In: Proceedings of ESANN (1997)"},{"key":"1137_CR34","doi-asserted-by":"publisher","first-page":"147","DOI":"10.1207\/s15516709cog0901_7","volume":"9","author":"DH Ackley","year":"1985","unstructured":"Ackley, D.H., Hinton, G.E., Sejinowski, T.J.: A learning algorithm for boltzmann machines. Cognit. Sci. 9, 147\u2013169 (1985)","journal-title":"Cognit. Sci."},{"key":"1137_CR35","doi-asserted-by":"publisher","first-page":"1860","DOI":"10.1126\/science.269.5232.1860","volume":"269","author":"R Hecht-Nielsen","year":"1995","unstructured":"Hecht-Nielsen, R.: Replicator neural networks for universal optimal source coding. Science 269, 1860\u20131863 (1995)","journal-title":"Science"},{"key":"1137_CR36","doi-asserted-by":"publisher","first-page":"383","DOI":"10.1080\/01621459.1974.10482962","volume":"69","author":"FR Hampel","year":"1974","unstructured":"Hampel, F.R.: The influence curve and its role in robust estimation. J. Am. Stat. Assoc. 69, 383\u2013393 (1974)","journal-title":"J. Am. Stat. Assoc."},{"key":"1137_CR37","series-title":"LNCS","first-page":"170","volume-title":"Outlier detection using replicator neural networks","author":"S Hawkins","year":"2002","unstructured":"Hawkins, S., He, H., Williams, G.J., Baxter, R.A.: DaWaK 2002. In: Kambayashi, Y., Winiwarter, W., Arikawa, M. (eds.) Outlier detection using replicator neural networks. LNCS, vol. 2454, pp. 170\u2013180. Springer, Heidelberg (2002)"},{"key":"1137_CR38","unstructured":"Zhao, X., Liang, J., Cao, F.: A simple and effective outlier detection algorithm for categorical data. Int. J. Mach. Learn. Cyber. 5, 469\u2013477 (2014)"},{"key":"1137_CR39","unstructured":"Zengyou, H., Shengchun, D., Xiaofei, X., Huang, J.Z.: A fast greedy algorithm for outlier mining. Applications of Evolutionary Computing. In: Proceedings of the EvoWorkshops 2006: EvoBIO, EvoCOMNET, EvoHOT EvoIASP, EvoINTERACTION, EvoMUSART, and EvoSTOC. LNCS, vol. 3907, pp. 567\u2013576 (2006)"},{"key":"1137_CR40","doi-asserted-by":"crossref","unstructured":"Zhang, W., Wu, J., Yu, J.: An improved method of outlier detection based on frequent pattern. In: Proceeding of WASE International Conference on Information Engineering (2010)","DOI":"10.1109\/ICIE.2010.97"},{"key":"1137_CR41","doi-asserted-by":"crossref","unstructured":"Otey, M.E., Ghoting, A., Parthasarathy, A.: Fast distributed outlier detection in mixed-attribute data sets. Data Min. Knowl. Discov. (2006)","DOI":"10.1007\/s10618-005-0014-6"}],"container-title":["Cluster Computing"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10586-017-1137-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10586-017-1137-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10586-017-1137-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,25]],"date-time":"2025-06-25T14:46:24Z","timestamp":1750862784000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10586-017-1137-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,9,4]]},"references-count":41,"journal-issue":{"issue":"S5","published-print":{"date-parts":[[2019,9]]}},"alternative-id":["1137"],"URL":"https:\/\/doi.org\/10.1007\/s10586-017-1137-4","relation":{},"ISSN":["1386-7857","1573-7543"],"issn-type":[{"type":"print","value":"1386-7857"},{"type":"electronic","value":"1573-7543"}],"subject":[],"published":{"date-parts":[[2017,9,4]]},"assertion":[{"value":"22 June 2017","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"14 August 2017","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 August 2017","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 September 2017","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}