{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,2]],"date-time":"2026-06-02T21:09:08Z","timestamp":1780434548686,"version":"3.54.1"},"reference-count":34,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2006,3,31]],"date-time":"2006-03-31T00:00:00Z","timestamp":1143763200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Knowl Inf Syst"],"published-print":{"date-parts":[[2006,12,4]]},"DOI":"10.1007\/s10115-005-0233-6","type":"journal-article","created":{"date-parts":[[2006,4,4]],"date-time":"2006-04-04T12:13:36Z","timestamp":1144152816000},"page":"45-84","source":"Crossref","is-referenced-by-count":62,"title":["Capabilities of outlier detection schemes in large datasets, framework and methodologies"],"prefix":"10.1007","volume":"11","author":[{"given":"Jian","family":"Tang","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Zhixiang","family":"Chen","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Ada Waichee","family":"Fu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"David W.","family":"Cheung","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2006,3,31]]},"reference":[{"key":"233_CR1","doi-asserted-by":"crossref","unstructured":"Aggarwal C, Yu P (2001) Outlier detection for high dimensional data. In: Aref WG (ed) Proceedings of the 2001 ACM-SIGMOD international conference on management of data, Santa Barbara, CA, USA, May 2001, ACM, pp 37\u201346","DOI":"10.1145\/375663.375668"},{"key":"233_CR2","doi-asserted-by":"crossref","unstructured":"Angiulli F, Pizzuti C (2002) Fast outlier detection in high dimensional spaces. In: Tapio Elomaa, Heikki Mannila, Hannu Toivonen (eds) Principles of data mining and knowledge discovery, proceedings of the 6th European PKDD conference, Helsinki, Finland, August 2002. Lecture notes in computer science, vol 2431. Springer, Berlin Heidelberg New York, pp 15\u201326","DOI":"10.1007\/3-540-45681-3_2"},{"key":"233_CR3","unstructured":"Arning A, Aggarwal R, Raghavan P (1996) A linear method for deviation detection in large databases. In: Simoudis E, Han J, Fayyad UM (eds) Proceedings of the second international conference on knowledge discovery and data mining (KDD96), Portland, Oregon, USA, 1996. AAAI Press, pp 164\u2013169"},{"key":"233_CR4","volume-title":"Modern information retrieval","author":"R Baeza-Yates","year":"1999","unstructured":"Baeza-Yates R, Ribeiro-Neto B (1999) Modern information retrieval. Addison Wesley, Reading, MA"},{"key":"233_CR5","doi-asserted-by":"crossref","unstructured":"Bay SD, Schwabacher M (2003) Mining distance-based outliers in near linear time with randomization and a simple pruning rule. In: Getoor L, Senator TE, Domingos P, Faloutsos C (eds) Proceedings of the ninth ACM SIGKDD international conference on knowledge discovery and data mining, Washington, DC, USA, August 2003. ACM, pp 29\u201338","DOI":"10.1145\/956750.956758"},{"key":"233_CR6","volume-title":"Outliers in statistical data","author":"V Barnett","year":"1994","unstructured":"Barnett V, Lewis T (1994) Outliers in statistical data. Wiley, New York"},{"key":"233_CR7","unstructured":"Blake CL, Merz CJ (1998) UCI Repository of machine learning databases. http:\/\/www.ics.uci.edu\/mlearn\/MLRepository.html . Department of Information and Computer Science, University of California, Irvine, CA"},{"key":"233_CR8","doi-asserted-by":"crossref","unstructured":"Breuning M, Kriegel H, Ng R, Sander J (2000) LOF: identifying density-based local outliers. In: Chen W, Naughton JF, Bernstein PA (eds) Proceedings of the 2000 ACM SIGMOD international conference on management of data, Dallas, Texas, USA, May 2000. ACM, pp 427\u2013438","DOI":"10.1145\/342009.335388"},{"key":"233_CR9","doi-asserted-by":"crossref","unstructured":"Chen Z, Fu A, Tang J (2003) On complementarity of cluster and outlier detection schemes. In: Kambayashi Y, Mohania MK, W\u00f3\u00df W (eds) Data warehousing and knowledge discovery, proceedings of the 5th international DaWaK conference, Prague, Czech Republic, September 2003. Lecture notes in computer science, vol 2737. Springer, Berlin Heidelberg New York, pp 234\u2013243","DOI":"10.1007\/978-3-540-45228-7_24"},{"key":"233_CR10","unstructured":"Chen Z, Tang J, Fu A (2003) Modeling and efficient mining of intentional knowledge of outliers. In: Proceedings of the 7th international database engineering and applications symposium (IDEAS03), Hong Kong, China, July 2003. IEEE Computer Society, pp 44\u201353"},{"issue":"8","key":"233_CR11","doi-asserted-by":"crossref","first-page":"655","DOI":"10.1002\/asi.1115","volume":"52","author":"Z Chen","year":"2001","unstructured":"Chen Z, Meng X, Fowler R, Zhu B (2001) FEATURES: real-time adaptive feature and document learning for web search. J Am Soc Inform Sci Technol 52(8):655\u2013665","journal-title":"J Am Soc Inform Sci Technol"},{"key":"233_CR12","volume-title":"Introduction to algorithms","author":"T Cormen","year":"2002","unstructured":"Cormen T, Leiserson C, Rivest R, Stein C (2002) Introduction to algorithms, 2nd edn. McGraw-Hill, New York","edition":"2nd edn."},{"key":"233_CR13","unstructured":"DuMouchel W, Schonlau M (1998) A fast computer intrusion detection algorithm based on hypothesis testing of command transition probabilities. In: Agrawal R, Stolorz PE, Piatetsky-Shapiro G (eds) Proceedings of the fourth international conference on knowledge discovery and data mining (KDD98), New York City, New York, USA, August 1998. AAAI Press, pp 189\u2013193"},{"key":"233_CR14","unstructured":"Ester M, Kriegel H, Sander J, Xu X (1996) A density-based algorithm for discovering clusters in large spatial databases with noise. In: Simoudis E, Han J, Fayyad UM (eds) Proceedings of the second international conference on knowledge discovery and data mining (KDD96), 1996. AAAI Press, pp 226\u2013231"},{"issue":"3","key":"233_CR15","doi-asserted-by":"crossref","first-page":"291","DOI":"10.1023\/A:1009700419189","volume":"1","author":"T Fawcett","year":"1997","unstructured":"Fawcett T, Provost F (1997) Adaptive fraud detection. Data Min Knowledge Discov J 1(3):291\u2013316","journal-title":"Data Min Knowledge Discov J"},{"key":"233_CR16","doi-asserted-by":"crossref","unstructured":"Guha S, Rastogi R, Shim K (1998) Cure: an efficient clustering algorithm for large databases. In: Haas LM, Tiwary A (eds) Proceedings ACM SIGMOD international conference on management of data, Seattle, Washington, USA, June 1998. ACM Press, pp 73\u201384","DOI":"10.1145\/276304.276312"},{"key":"233_CR17","doi-asserted-by":"crossref","unstructured":"Harkins S, He H, Williams CJ, Baster RA (2002) Outlier detection using replicator neural networks. In: Kambayashi Y, Winiwarter W, Arikawa M (eds) Data warehousing and knowledge discovery, proceedings of the 4th international DaWaK conference, Aix-en-Provence, France, September 2002. Lecture notes in computer science, vol 2454. Springer, Berlin Heidelberg New York, pp 170\u2013180","DOI":"10.1007\/3-540-46145-0_17"},{"key":"233_CR18","doi-asserted-by":"crossref","DOI":"10.1007\/978-94-015-3994-4","volume-title":"Identification of outliers","author":"D Hawkins","year":"1980","unstructured":"Hawkins D (1980) Identification of outliers. Chapman & Hall, London"},{"key":"233_CR19","doi-asserted-by":"crossref","first-page":"1641","DOI":"10.1016\/S0167-8655(03)00003-5","volume":"24","author":"Z He","year":"2003","unstructured":"He Z, Xu X, Deng S (2003) Discovering cluster-based local outliers. Pattern Recog Lett 24:1641\u20131650","journal-title":"Pattern Recog Lett"},{"key":"233_CR20","first-page":"3509","volume":"24","author":"T Hu","year":"2003","unstructured":"Hu T, Sung SY (2003) Detecting pattern-based outliers. Pattern Recog Lett 24:3509\u20133068","journal-title":"Pattern Recog Lett"},{"key":"233_CR21","doi-asserted-by":"crossref","unstructured":"Jin W, Tung A, Han J (2001) Mining top-n local outliers in large databases. In: Proceedings of the seventh ACM SIGKDD international conference on knowledge discovery and data mining, San Francisco, CA, USA, August 2001. ACM, pp 293\u2013298","DOI":"10.1145\/502512.502554"},{"issue":"4","key":"233_CR22","doi-asserted-by":"crossref","first-page":"349","DOI":"10.1023\/A:1024988512476","volume":"7","author":"E Keogh","year":"2003","unstructured":"Keogh E, Kasetty S (2003) On the need for time series data mining benchmarks: a survey and empirical demonstration. Data Min Knowledge Discov 7(4):349\u2013371","journal-title":"Data Min Knowledge Discov"},{"key":"233_CR23","unstructured":"Knorr E, Ng R (1998) Algorithms for mining distance-based outliers in large datasets. In: Gupta A, Shmueli O, Widom J (eds) Proceedings of 24rd international conference on very large databases, New York City, New York, USA, August 1998. Morgan Kaufmann, pp 392\u2013403"},{"key":"233_CR24","unstructured":"Knorr E, Ng R (1999) Finding intentional knowledge of distance-based outliers. In: Atkinson MP, Orlowska ME, Valduriez P, Zdonik SB, Brodie ML (eds) Proceedings of the 25th international conference on very large databases, Edinburgh, Scotland, UK, September 1999. Morgan Kaufmann, pp 211\u2013222"},{"key":"233_CR25","doi-asserted-by":"crossref","unstructured":"Lazarevic A, Ertoz L, Ozgur A, Srivastava J, Kumar V (2003) A comparative study of anomaly detection schemes in network intrusion detection. In: Barbar D, Kamath C (eds) Proceedings of the third SIAM international conference on data mining, San Francisco, CA, USA, May 2003. SIAM","DOI":"10.1137\/1.9781611972733.3"},{"key":"233_CR26","unstructured":"Meng X, Chen Z (2004) On user-oriented measurements of effectiveness of web information retrieval systems. In: Arabnia HR, Droegehorn O (eds) Proceedings of the international conference on internet computing, Las Vegas, Nevada, USA, June 2004, vol 1. CSREA Press, pp 527\u2013533"},{"key":"233_CR27","unstructured":"Ng R, Han J (1994) Efficient and effective clustering methods for spatial data mining. In: Bocca JB, Jarke M, Zaniolo C (eds) Proceedings of the 20th international conference on very large databases, Santiago de Chile, Chile, September 1994. Morgan Kaufmann, pp 144\u2013155"},{"key":"233_CR28","doi-asserted-by":"crossref","unstructured":"Ramaswamy S, Rastogi R, Kyuseok S (2000) Efficient algorithms for mining outliers from large data sets. In: Chen W, Naughton JF, Bernstein PA (eds) Proceedings of the 2000 ACM SIGMOD international conference on management of data, Dallas, Texas, USA, May 2000. ACM, pp 427\u2013438","DOI":"10.1145\/342009.335437"},{"key":"233_CR29","doi-asserted-by":"crossref","unstructured":"Roussopoulos N, Kelley S, Vincent F (1995) Nearest neighbor queries. In: Carey MJ, Schneider DA (eds) Proceedings of the 1995 ACM SIGMOD international conference on management of data, San Jose, California, USA, May 1995. ACM, pp 71\u201379","DOI":"10.1145\/223784.223794"},{"key":"233_CR30","volume-title":"Automated text processing: the transformation, analysis, and retrieval of information by computer","author":"G Salton","year":"1989","unstructured":"Salton G (1989) Automated text processing: the transformation, analysis, and retrieval of information by computer. Addison Wesley, Reading, MA"},{"key":"233_CR31","unstructured":"Sheikholeslami G, Chatterjee S, Zhang A (1998) WaveCluster: a multi-resolution clustering approach for very large spatial databases. In: Gupta A, Shmueli O, Widom J (eds) Proceedings of 24rd international conference on very large databases, New York City, New York, USA, August 1998. Morgan Kaufmann, pp 428\u2013439"},{"key":"233_CR32","unstructured":"Stolfo S, Fan W, Lee W, Prodromidis A, Chan P (2000) Cost-based modeling for fraud and intrusion detection: results from the JAM Project. In: Proceedings of DARPA information survivability conference and exposition, vol 2, pp 1130\u20131144"},{"key":"233_CR33","doi-asserted-by":"crossref","unstructured":"Tang J, Chen Z, Fu A, Cheung D (2002) Enhancing effectiveness of outlier detections for low density patterns. In: Cheng M-S, Yu PS, Liu B (eds) Advances in knowledge discovery and data mining, proceedings of the 6th Pacific-Asia PAKDD conference, Taipei, Taiwan, May 2002. Lecture notes in computer science, vol 2336. Springer, Berlin Heidelberg New York, pp 535\u2013548","DOI":"10.1007\/3-540-47887-6_53"},{"key":"233_CR34","doi-asserted-by":"crossref","unstructured":"Zhang T, Ramakrishnan R, Linvy M (1996) BIRCH: an efficient data clustering method for very large databases. In: Jagadish HV, Mumick IS (eds) Proceedings of the 1996 ACM SIGMOD international conference on management of data, Montreal, Quebec, Canada, June 1996. ACM, pp 103\u2013114","DOI":"10.1145\/233269.233324"}],"container-title":["Knowledge and Information Systems"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10115-005-0233-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10115-005-0233-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10115-005-0233-6","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,29]],"date-time":"2019-05-29T10:10:14Z","timestamp":1559124614000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10115-005-0233-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2006,3,31]]},"references-count":34,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2006,12,4]]}},"alternative-id":["233"],"URL":"https:\/\/doi.org\/10.1007\/s10115-005-0233-6","relation":{},"ISSN":["0219-1377","0219-3116"],"issn-type":[{"value":"0219-1377","type":"print"},{"value":"0219-3116","type":"electronic"}],"subject":[],"published":{"date-parts":[[2006,3,31]]}}}