{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,19]],"date-time":"2025-09-19T08:07:10Z","timestamp":1758269230379,"version":"3.33.0"},"publisher-location":"Berlin, Heidelberg","reference-count":50,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540753971"},{"type":"electronic","value":"9783540753988"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2008]]},"DOI":"10.1007\/978-3-540-75398-8_1","type":"book-chapter","created":{"date-parts":[[2007,12,24]],"date-time":"2007-12-24T05:00:38Z","timestamp":1198472438000},"page":"1-22","source":"Crossref","is-referenced-by-count":6,"title":["Information Theoretic Feature Selection and Projection"],"prefix":"10.1007","author":[{"given":"Deniz","family":"Erdogmus","sequence":"first","affiliation":[]},{"given":"Umut","family":"Ozertem","sequence":"additional","affiliation":[]},{"given":"Tian","family":"Lan","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"doi-asserted-by":"crossref","unstructured":"Duch W, Wieczorek T, Biesiada J, Blachnik M (2004) Comparison of Feature Ranking Methods Based on Information Entropy, Proceedings of International Joint Conference on Neural Networks 1415-1420","key":"1_CR2_1","DOI":"10.1109\/IJCNN.2004.1380157"},{"key":"1_CR3_1","doi-asserted-by":"publisher","first-page":"305","DOI":"10.1023\/B:VLSI.0000027493.48841.39","volume":"37","author":"D Erdogmus","year":"2004","unstructured":"Erdogmus D, Principe J C (2004) Lower and Upper Bounds for Misclassification Probability Based on Renyi\u2019s Information, Journal of VLSI Signal Processing Systems 37:305-317","journal-title":"Journal of VLSI Signal Processing Systems"},{"key":"1_CR4_1","volume-title":"Transmission of Information: A Statistical Theory of Communications","author":"R M Fano","year":"1961","unstructured":"Fano R M (1961) Transmission of Information: A Statistical Theory of Communications, Wiley, New York"},{"key":"1_CR5_1","doi-asserted-by":"publisher","first-page":"368","DOI":"10.1109\/TIT.1970.1054466","volume":"16","author":"M E Hellman","year":"1970","unstructured":"Hellman M E, Raviv J (1970) Probability of Error, Equivocation and the Chernoff Bound, IEEE Transactions on Information Theory 16:368-372","journal-title":"IEEE Transactions on Information Theory"},{"unstructured":"Koller D, Sahami M (1996) Toward Optimal Feature Selection, Proceedings of the International Conference on Machine Learning 284-292","key":"1_CR6_1"},{"key":"1_CR7_1","doi-asserted-by":"publisher","first-page":"537","DOI":"10.1109\/72.298224","volume":"5","author":"R Battiti","year":"1994","unstructured":"Battiti R (1994) Using Mutual Information for Selecting Features in Supervised Neural Net Learning, Neural Networks 5:537-550","journal-title":"Neural Networks"},{"unstructured":"Bonnlander B V, Weigend A S (1994) Selecting Input Variables Using Mutual Information and Nonparametric Density Estimation, Proceedings of Interna-tional Symposium on Artificial Neural Networks 42-50","key":"1_CR8_1"},{"unstructured":"Yang H, Moody J (2000) Data Visualization and Feature Selection: New Algorithms for Nongaussian Data, Advances in Neural Information Processing Systems 687-693","key":"1_CR9_1"},{"key":"1_CR10_1","volume-title":"Subspace Methods of Pattern Recognition","author":"E Oja","year":"1983","unstructured":"Oja E (1983) Subspace Methods of Pattern Recognition, Wiley, New York"},{"key":"1_CR11_1","volume-title":"Pattern Recognition: A Statistical Approach","author":"P A Devijver","year":"1982","unstructured":"Devijver P A, Kittler J (1982) Pattern Recognition: A Statistical Approach, Prentice Hall, London"},{"key":"1_CR12_1","volume-title":"Introduction to Statistical Pattern Recognition","author":"K Fukunaga","year":"1990","unstructured":"Fukunaga K (1990) Introduction to Statistical Pattern Recognition, Academic, New York"},{"key":"1_CR13_1","doi-asserted-by":"publisher","first-page":"1957","DOI":"10.1162\/089976699300016043","volume":"11","author":"R Everson","year":"2003","unstructured":"Everson R, Roberts S (2003) Independent Component Analysis: A Flexible Nonlinearity and Decorrelating Manifold Approach, Neural Computation 11:1957-1983","journal-title":"Neural Computation"},{"doi-asserted-by":"crossref","unstructured":"Hyv\u00e4rinen A, Oja E, Hoyer P, Hurri J (1998) Image Feature Extraction by Sparse coding and Independent Component Analysis, Proceedings of ICPR 1268-1273","key":"1_CR14_1","DOI":"10.1109\/ICPR.1998.711932"},{"key":"1_CR15_1","doi-asserted-by":"publisher","first-page":"1415","DOI":"10.1162\/153244303322753742","volume":"3","author":"K Torkkola","year":"2003","unstructured":"Torkkola K (2003) Feature Extraction by Non-Parametric Mutual Information Maximization, Journal of Machine Learning Research 3:1415-1438","journal-title":"Journal of Machine Learning Research"},{"key":"1_CR16_1","doi-asserted-by":"publisher","first-page":"537","DOI":"10.1109\/72.298224","volume":"5","author":"R Battiti","year":"1994","unstructured":"Battiti R (1994) Using Mutual Information for Selecting Features in Supervised Neural Net Training, IEEE Transaction Neural Networks 5:537-550","journal-title":"IEEE Transaction Neural Networks"},{"unstructured":"Kira K, Rendell L (1992) The Feature Selection Problem: Traditional Methods and a New Algorithm, Proceedings of Conference on Artificial Intelligence 129-134","key":"1_CR17_1"},{"doi-asserted-by":"crossref","unstructured":"John G H, Kohavi R, Pfleger K (1994) Irrelevant Features and the Subset Selection Problem, Proceedings of Conference on Machine Learning 121-129","key":"1_CR18_1","DOI":"10.1016\/B978-1-55860-335-6.50023-4"},{"key":"1_CR19_1","doi-asserted-by":"publisher","first-page":"1385","DOI":"10.1109\/TPAMI.2006.186","volume":"28","author":"II K E Hild","year":"2006","unstructured":"Hild II K E, Erdogmus D, Torkkola K, Principe J C (2006) Feature Extraction Using Information-Theoretic Learning, IEEE Transactions on Pattern Analysis and Machine Intelligence 28:1385-1392","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"1_CR20_1","doi-asserted-by":"publisher","first-page":"1157","DOI":"10.1162\/153244303322753616","volume":"3","author":"I Guyon","year":"2003","unstructured":"Guyon I, Elisseeff A (2003) An Introduction to Variable and Feature Selection, Journal of Machine Learning Research 3:1157-1182 (Special Issue on Variable and Feature Selection)","journal-title":"Journal of Machine Learning Research"},{"key":"1_CR21_1","doi-asserted-by":"publisher","first-page":"1299","DOI":"10.1162\/089976698300017467","volume":"10","author":"B Scholkopf","year":"1998","unstructured":"Scholkopf B, Smola A, Muller K R (1998) Nonlinear Component Analysis as a Kernel Eigenvalue Problem, Neural Computation 10:1299-1319","journal-title":"Neural Computation"},{"key":"1_CR22_1","doi-asserted-by":"publisher","DOI":"10.1002\/0471221317","volume-title":"Independent Component Analysis","author":"A Hyvarinen","year":"2001","unstructured":"Hyvarinen A, Karhunen J, Oja E (2001) Independent Component Analysis, Wiley, New York"},{"key":"1_CR23_1","doi-asserted-by":"publisher","first-page":"788","DOI":"10.1038\/44565","volume":"401","author":"D D Lee","year":"1999","unstructured":"Lee D D, Seung H S (1999) Learning the parts of objects by non-negative matrix factorization, Nature 401:788-791","journal-title":"Nature"},{"key":"1_CR24_1","doi-asserted-by":"publisher","first-page":"2323","DOI":"10.1126\/science.290.5500.2323","volume":"290","author":"S Roweis","year":"2000","unstructured":"Roweis S, Saul L (2000) Nonlinear Dimensionality Reduction by Locally Linear Embedding, Science 290:2323-2326","journal-title":"Science"},{"key":"1_CR25_1","first-page":"1077","volume":"5","author":"J Costa","year":"2005","unstructured":"Costa J, Hero A O (2005) Classification Constrained Dimensionality Reduction, Proceedings of ICASSP 5:1077-1080","journal-title":"Proceedings of ICASSP"},{"key":"1_CR26_1","doi-asserted-by":"publisher","first-page":"2385","DOI":"10.1162\/089976600300014980","volume":"12","author":"G Baudat","year":"2000","unstructured":"Baudat G, Anouar F (2000) Generalized Discriminant Analysis Using a Kernel Approach, Neural Computation 12:2385-2404","journal-title":"Neural Computation"},{"key":"1_CR27_1","first-page":"265","volume-title":"Unsupervised Adaptive Filtering","author":"J C Principe","year":"2000","unstructured":"Principe J C, Fisher J W, Xu D (2000) Information Theoretic Learning, In Haykin S (Ed.) Unsupervised Adaptive Filtering, Wiley, New York, 265-319"},{"key":"1_CR28_1","volume-title":"On Estimation of a Probability Density Function and Mode, Time Series Analysis Papers","author":"E Parzen","year":"1967","unstructured":"Parzen E (1967) On Estimation of a Probability Density Function and Mode, Time Series Analysis Papers, Holden-Day, San Diego, California"},{"key":"1_CR29_1","volume-title":"Information Theoretic Learning: Renyi\u2019s Entropy and its Applications to Adaptive System Training","author":"D Erdogmus","year":"2002","unstructured":"Erdogmus D (2002) Information Theoretic Learning: Renyi\u2019s Entropy and its Applications to Adaptive System Training, PhD Dissertation, University of Florida, Gainesville, Florida"},{"key":"1_CR30_1","doi-asserted-by":"publisher","first-page":"066138","DOI":"10.1103\/PhysRevE.69.066138","volume":"69","author":"A Kraskov","year":"2004","unstructured":"Kraskov A, Stoegbauer H, Grassberger P (2004) Estimating Mutual Information, Physical Review E 69:066138","journal-title":"Physical Review E"},{"key":"1_CR31_1","doi-asserted-by":"publisher","first-page":"1271","DOI":"10.1162\/jmlr.2003.4.7-8.1271","volume":"4","author":"E G Learned-Miller","year":"2003","unstructured":"Learned-Miller E G, Fisher J W (2003) ICA Using Spacings Estimates of Entropy, Journal of Machine Learning Research 4:1271-1295","journal-title":"Journal of Machine Learning Research"},{"key":"1_CR32_1","doi-asserted-by":"crossref","first-page":"54","DOI":"10.1111\/j.2517-6161.1976.tb01566.x","volume":"38","author":"O Vasicek","year":"1976","unstructured":"Vasicek O, (1976) A Test for Normality Based on Sample Entropy, Journal of the Royal Statistical Society B 38:54-59","journal-title":"Journal of the Royal Statistical Society B"},{"key":"1_CR33_1","doi-asserted-by":"publisher","first-page":"85","DOI":"10.1109\/MSP.2002.1028355","volume":"19","author":"A O Hero","year":"2002","unstructured":"Hero A O, Ma B, Michel O J J, Gorman J (2002) Applications of Entropic Spanning Graphs, IEEE Signal Processing Magazine 19:85-95","journal-title":"IEEE Signal Processing Magazine"},{"key":"1_CR34_1","first-page":"17","volume":"6","author":"J Beirlant","year":"1997","unstructured":"Beirlant J, Dudewicz E J, Gyorfi L, Van Der Meulen E C (1997) Nonparametric Entropy Estimation: An Overview, International Journal of Mathematical and Statistical Sciences 6:17-39","journal-title":"International Journal of Mathematical and Statistical Sciences"},{"key":"1_CR35_1","doi-asserted-by":"publisher","first-page":"1780","DOI":"10.1109\/TSP.2002.1011217","volume":"50","author":"D Erdogmus","year":"2002","unstructured":"Erdogmus D, Principe J C (2002) An Error-Entropy Minimization Algorithm for Supervised Training of Nonlinear Adaptive Systems, IEEE Transactions on Signal Processing 50:1780-1786","journal-title":"IEEE Transactions on Signal Processing"},{"issue":"6","key":"1_CR36_1","doi-asserted-by":"publisher","first-page":"14","DOI":"10.1109\/SP-M.2006.248709","volume":"23","author":"D Erdogmus","year":"2006","unstructured":"Erdogmus D, Principe J C (2006) From Linear Adaptive Filtering to Nonlinear Information Processing, IEEE Signal Processing Magazine 23(6):14-33","journal-title":"IEEE Signal Processing Magazine"},{"key":"1_CR37_1","doi-asserted-by":"publisher","first-page":"1235","DOI":"10.1162\/089976604773717595","volume":"16","author":"D Erdogmus","year":"2004","unstructured":"Erdogmus D, Hild II K E, Rao Y N, Principe J C (2004) Minimax Mutual Infor-mation Approach for Independent Components Analysis, Neural Computation 16:1235-1252","journal-title":"Neural Computation"},{"key":"1_CR38_1","doi-asserted-by":"publisher","first-page":"669","DOI":"10.1162\/089976602317250942","volume":"14","author":"M Girolami","year":"2002","unstructured":"Girolami M (2002) Orthogonal Series Density Estimation and the Kernel Eigenvalue Problem, Neural Computation, MIT Press 14:669-688","journal-title":"Neural Computation, MIT Press"},{"key":"1_CR39_1","volume-title":"Pattern Classification","author":"R O Duda","year":"2000","unstructured":"Duda R O, Hart P E, Stork D G (2000) Pattern Classification (2nd ed.), Wiley, New York"},{"key":"1_CR40_1","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4613-0125-7","volume-title":"Combinatorial Methods in Density Estimation","author":"L Devroye","year":"2001","unstructured":"Devroye L, Lugosi G (2001) Combinatorial Methods in Density Estimation, Springer, Berlin Heidelberg New York"},{"key":"1_CR41_1","volume-title":"Probability Theory","author":"A Renyi","year":"1970","unstructured":"Renyi A (1970) Probability Theory, North-Holland, Amsterdam"},{"key":"1_CR42_1","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4899-3324-9","volume-title":"Density Estimation for Statistics and Data Analysis","author":"B W Silverman","year":"1986","unstructured":"Silverman B W, (1986) Density Estimation for Statistics and Data Analysis, Chapman and Hall, London"},{"key":"1_CR43_1","doi-asserted-by":"publisher","first-page":"1175","DOI":"10.1109\/TC.1976.1674577","volume":"25","author":"R P W Duin","year":"1976","unstructured":"Duin R P W (1976) On the Choice of the Smoothing Parameters for Parzen Estimators of Probability Density Functions, IEEE Transactions on Computers 25:1175-1179","journal-title":"IEEE Transactions on Computers"},{"key":"1_CR44_1","doi-asserted-by":"publisher","first-page":"828","DOI":"10.1109\/TNN.2004.828766","volume":"15","author":"N Schraudolph","year":"2004","unstructured":"Schraudolph N (2004) Gradient-Based Manipulation of Nonparametric Entropy Estimates, IEEE Transactions on Neural Networks 15:828-837","journal-title":"IEEE Transactions on Neural Networks"},{"key":"1_CR45_1","doi-asserted-by":"publisher","first-page":"415","DOI":"10.1098\/rsta.1909.0016","volume":"209","author":"J Mercer","year":"1909","unstructured":"Mercer J (1909) Functions of Positive and Negative Type, and Their Connection with the Theory of Integral Equations, Transactions of the London Philosophical Society A 209:415-446","journal-title":"Transactions of the London Philosophical Society A"},{"key":"1_CR46_1","doi-asserted-by":"crossref","DOI":"10.1137\/1.9781611970128","volume-title":"Spline Models for Observational Data","author":"G Wahba","year":"1990","unstructured":"Wahba G (1990) Spline Models for Observational Data, SIAM, Philedelphia, Pennsylvania"},{"volume-title":"Reproducing Kernel Hilbert Spaces: Applications in Statistical Signal Processing","year":"1982","unstructured":"Weinert H (ed.) (1982) Reproducing Kernel Hilbert Spaces: Applications in Statistical Signal Processing, Hutchinson Ross Publisher Co., Stroudsburg, Pennsylvania","key":"1_CR47_1"},{"key":"1_CR48_1","first-page":"298","volume":"23","author":"C Fowlkes","year":"2004","unstructured":"Fowlkes C, Belongie S, Chung F, Malik J (2004) Spectral Grouping Using the Nystrom Method, IEEE Transactions on Pattern Analysis and Machine Intelligence 23:298-305","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"1_CR49_1","doi-asserted-by":"publisher","first-page":"1241","DOI":"10.1016\/j.patcog.2006.01.014","volume":"39","author":"U Ozertem","year":"2006","unstructured":"Ozertem U, Erdogmus D, Jenssen R (2006) Spectral Feature Projections That Maximize Shannon Mutual Information with Class Labels, Pattern Recognition 39:1241-1252","journal-title":"Pattern Recognition"},{"key":"1_CR50_1","doi-asserted-by":"publisher","first-page":"75","DOI":"10.1016\/0893-6080(88)90023-8","volume":"1","author":"R P Gorman","year":"1988","unstructured":"Gorman R P, Sejnowski T J (1988) Analysis of Hidden Units in a Layered Network Trained to Classify Sonar Targets, Neural Networks 1:75-79","journal-title":"Neural Networks"},{"unstructured":"http:\/\/www.ics.uci.edu\/mlearn\/MLRepository.html","key":"1_CR51_1"}],"container-title":["Studies in Computational Intelligence","Speech, Audio, Image and Biomedical Signal Processing using Neural Networks"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-540-75398-8_1.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,24]],"date-time":"2025-01-24T19:48:37Z","timestamp":1737748117000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-540-75398-8_1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2008]]},"ISBN":["9783540753971","9783540753988"],"references-count":50,"URL":"https:\/\/doi.org\/10.1007\/978-3-540-75398-8_1","relation":{},"ISSN":["1860-949X"],"issn-type":[{"type":"print","value":"1860-949X"}],"subject":[],"published":{"date-parts":[[2008]]}}}