{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,16]],"date-time":"2025-10-16T09:57:53Z","timestamp":1760608673799},"publisher-location":"Berlin, Heidelberg","reference-count":25,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642253232"},{"type":"electronic","value":"9783642253249"}],"license":[{"start":{"date-parts":[[2011,1,1]],"date-time":"2011-01-01T00:00:00Z","timestamp":1293840000000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2011]]},"DOI":"10.1007\/978-3-642-25324-9_31","type":"book-chapter","created":{"date-parts":[[2011,11,21]],"date-time":"2011-11-21T13:04:10Z","timestamp":1321880650000},"page":"357-369","source":"Crossref","is-referenced-by-count":9,"title":["Instance Selection in Text Classification Using the Silhouette Coefficient Measure"],"prefix":"10.1007","author":[{"given":"Debangana","family":"Dey","sequence":"first","affiliation":[]},{"given":"Thamar","family":"Solorio","sequence":"additional","affiliation":[]},{"given":"Manuel","family":"Montes y G\u00f3mez","sequence":"additional","affiliation":[]},{"given":"Hugo Jair","family":"Escalante","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"31_CR1","unstructured":"Settles, B.: Active Learning Literature Surve, Computer Sciences Technical Report 1648. University of Wisconsin\u2013Madison (2009)"},{"key":"31_CR2","doi-asserted-by":"crossref","unstructured":"Hubert, M., Struyf, A., Rousseeuw, P.: Clustering in an Object-Oriented Environment. Journal of Statistical Software\u00a01(4) (1996)","DOI":"10.18637\/jss.v001.i04"},{"key":"31_CR3","doi-asserted-by":"crossref","unstructured":"Czarnowski, I.: Cluster-based instance selection for machine classification. Knowledge and Information Systems (2011)","DOI":"10.1007\/s10115-010-0375-z"},{"key":"31_CR4","unstructured":"Slonim, N., Tishby, N.: Agglomerative Information Bottleneck. In: Advances in Neural Information Processing systems (NIPS-12) (1999)"},{"key":"31_CR5","doi-asserted-by":"crossref","unstructured":"Baker, L.D., McCallum, A.K.: Distributional clustering of words for text classification. In: Proc. of the 21st Annual International ACM SIGIR Conference on Research and Development in Information Retrieval - SIGIR 1998, pp. 96\u2013103 (1998)","DOI":"10.1145\/290941.290970"},{"key":"31_CR6","first-page":"1265","volume":"3","author":"I.S. Dhillon","year":"2003","unstructured":"Dhillon, I.S., Mallela, S., Kumar, R.: A Divisive Information-Theoretic Feature Clustering Algorithm for Text Classification. Journal of Machine Learning Research\u00a03, 1265\u20131287 (2003)","journal-title":"Journal of Machine Learning Research"},{"key":"31_CR7","doi-asserted-by":"crossref","unstructured":"Olvera-L\u00f3pez, J.A., Carrasco-Ochoa, J.A., Mart\u00ednez-Trinidad, J.F.: Object selection based on clustering and border objects. In: Kurzynski, M., et al. (eds.) Computer Recognition Systems 2, Wroclaw, Poland. ASC, vol.\u00a045, pp. 27\u201334 (2007)","DOI":"10.1007\/978-3-540-75175-5_4"},{"key":"31_CR8","unstructured":"Martinez, T.R.: Reduction Techniques for Instance-Based Learning Algorithms. Machine Learning\u00a0286 (2000)"},{"key":"31_CR9","unstructured":"Brighton, H.: Advances in Instance Selection for Instance-Based Learning. Algorithms. Knowledge Creation Diffusion Utilization, 153\u2013172 (2002)"},{"key":"31_CR10","doi-asserted-by":"publisher","first-page":"495","DOI":"10.1016\/j.patcog.2005.11.004","volume":"39","author":"A. Lumini","year":"2006","unstructured":"Lumini, A., Nanni, L.: A clustering method for automatic biometric template selection. Pattern Recognition\u00a039, 495\u2013497 (2006)","journal-title":"Pattern Recognition"},{"key":"31_CR11","series-title":"Lecture Notes in Artificial Intelligence","doi-asserted-by":"publisher","first-page":"159","DOI":"10.1007\/11846406_20","volume-title":"Text, Speech and Dialogue","author":"K. Shin","year":"2006","unstructured":"Shin, K., Abraham, A., Han, S.-Y.: Enhanced Centroid-Based Classification Technique by Filtering Outliers. In: Sojka, P., Kope\u010dek, I., Pala, K. (eds.) TSD 2006. LNCS (LNAI), vol.\u00a04188, pp. 159\u2013163. Springer, Heidelberg (2006)"},{"key":"31_CR12","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1111\/0824-7935.00103","volume":"16","author":"D.R. Wilson","year":"2000","unstructured":"Wilson, D.R., Martinez, T.R.: An Integrated Instance-Based Learning Algorithm. Computational Intelligence\u00a016, 1\u201328 (2000)","journal-title":"Computational Intelligence"},{"key":"31_CR13","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"153","DOI":"10.1007\/978-3-540-85920-8_19","volume-title":"Progress in Pattern Recognition, Image Analysis and Applications","author":"J.A. Olvera-L\u00f3pez","year":"2008","unstructured":"Olvera-L\u00f3pez, J.A., Carrasco-Ochoa, J.A., Mart\u00ednez-Trinidad, J.F.: Prototype selection via prototype relevance. In: Ruiz-Shulcloper, J., Kropatsch, W.G. (eds.) CIARP 2008. LNCS, vol.\u00a05197, pp. 153\u2013160. Springer, Heidelberg (2008)"},{"key":"31_CR14","doi-asserted-by":"crossref","unstructured":"Kira, K., Rendell, L.A.: A practical approach to feature selection. In: Proc. of 9th International Conference on Machine Learning, pp. 249\u2013256 (1992)","DOI":"10.1016\/B978-1-55860-247-2.50037-1"},{"key":"31_CR15","doi-asserted-by":"crossref","unstructured":"Hall, M., Frank, E., Holmes, G., Bernhard, P., Reutemann, P., Witten, I.H.: The WEKA Data Mining Software: An Update. SIGKDD Explorations\u00a011(1) (2009)","DOI":"10.1145\/1656274.1656278"},{"key":"31_CR16","unstructured":"Classic4 Dataset, ftp:\/\/ftp.cs.cornell.edu\/pub\/smart\/"},{"key":"31_CR17","unstructured":"Reuters R8 Dataset, http:\/\/www.daviddlewis.com\/resources\/testcollections\/reuters21578"},{"key":"31_CR18","unstructured":"20 Newsgroup Dataset, http:\/\/people.csail.mit.edu\/jrennie\/public_html\/20Newsgroup\/"},{"key":"31_CR19","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1016\/0377-0427(87)90125-7","volume":"20","author":"P.J. Rousseeuw","year":"1987","unstructured":"Rousseeuw, P.J.: Silhouettes: a Graphical Aid to the Interpretation and Validation of Cluster Analysis. Computational and Applied Mathematics\u00a020, 53\u201365 (1987), doi:10.1016\/0377-0427(87)90125-7","journal-title":"Computational and Applied Mathematics"},{"issue":"7","key":"31_CR20","doi-asserted-by":"publisher","first-page":"1148","DOI":"10.1093\/comjnl\/bxq069","volume":"54","author":"D. Pinto","year":"2011","unstructured":"Pinto, D., Rosso, P., Jim\u00e9nez-Salazar, H.: A Self-enriching Methodology for Clustering Narrow Domain Short Texts. Computer Journal\u00a054(7), 1148\u20131165 (2011)","journal-title":"Computer Journal"},{"issue":"7","key":"31_CR21","doi-asserted-by":"publisher","first-page":"1148","DOI":"10.1093\/comjnl\/bxq069","volume":"54","author":"D. Pinto","year":"2011","unstructured":"Pinto, D., Rosso, P., Jim\u00e9nez-Salazar, H.: A Self-enriching Methodology for Clustering Narrow Domain Short Texts. Computer Journal\u00a054(7), 1148\u20131165 (2011)","journal-title":"Computer Journal"},{"key":"31_CR22","volume-title":"Human Behavior and the Principle of Last-Effort","author":"G.K. Zipf","year":"1949","unstructured":"Zipf, G.K.: Human Behavior and the Principle of Last-Effort. Addison-Wesley, Cambridge (1949)"},{"key":"31_CR23","doi-asserted-by":"crossref","unstructured":"Booth, A.: A Law of Ocurrences for Words of Low Frequency. Information and Control (1967)","DOI":"10.1016\/S0019-9958(67)90201-X"},{"key":"31_CR24","unstructured":"Urbizag\u00e1stegui, R.: Las posibilidades de la Ley de Zipf en la indizaci\u00f3n autom\u00e1tica, Research report of the California Riverside University (1999)"},{"key":"31_CR25","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"536","DOI":"10.1007\/11671299_55","volume-title":"Computational Linguistics and Intelligent Text Processing","author":"D. Pinto","year":"2006","unstructured":"Pinto, D., Jim\u00e9nez-Salazar, H., Rosso, P.: Clustering Abstracts of Scientific Texts Using the Transition Point Technique. In: Gelbukh, A.F. (ed.) CICLing 2006. LNCS, vol.\u00a03878, pp. 536\u2013546. Springer, Heidelberg (2006)"}],"container-title":["Lecture Notes in Computer Science","Advances in Artificial Intelligence"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-25324-9_31","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,6,19]],"date-time":"2019-06-19T22:00:35Z","timestamp":1560981635000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-25324-9_31"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2011]]},"ISBN":["9783642253232","9783642253249"],"references-count":25,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-25324-9_31","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2011]]}}}