{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,11]],"date-time":"2026-03-11T13:54:09Z","timestamp":1773237249119,"version":"3.50.1"},"reference-count":66,"publisher":"Elsevier","isbn-type":[{"value":"9780444862174","type":"print"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[1982]]},"DOI":"10.1016\/s0169-7161(82)02038-0","type":"book-chapter","created":{"date-parts":[[2005,4,18]],"date-time":"2005-04-18T19:58:53Z","timestamp":1113854333000},"page":"773-791","source":"Crossref","is-referenced-by-count":96,"title":["35 Use of distance measures, information measures and error bounds in feature evaluation"],"prefix":"10.1016","author":[{"given":"Moshe","family":"Ben-Bassat","sequence":"first","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/S0169-7161(82)02038-0_bib1","series-title":"On Measures of Information and Their Characterization","author":"Aczel","year":"1975"},{"key":"10.1016\/S0169-7161(82)02038-0_bib2","doi-asserted-by":"crossref","first-page":"131","DOI":"10.1111\/j.2517-6161.1966.tb00626.x","article-title":"A general class of coefficients of divergence of one distribution from another","volume":"28","author":"Ali","year":"1966","journal-title":"J. Royal Statis. Soc. Ser. B."},{"key":"10.1016\/S0169-7161(82)02038-0_bib3","series-title":"Proc. Third Internat. Joint Conf. Pattern Recognition","first-page":"45","article-title":"On feature ordering in practice and some finite sample effects","author":"Backer","year":"1976"},{"key":"10.1016\/S0169-7161(82)02038-0_bib4","doi-asserted-by":"crossref","first-page":"170","DOI":"10.1109\/TC.1978.1675054","article-title":"Myopic policies in sequential classification","volume":"27","author":"Ben-Bassat","year":"1978","journal-title":"IEEE Trans. Comput."},{"key":"10.1016\/S0169-7161(82)02038-0_bib5","doi-asserted-by":"crossref","first-page":"769","DOI":"10.1109\/TIT.1978.1055952","article-title":"\u03b5-equivalence of feature selection rules","volume":"24","author":"Ben-Bassat","year":"1978","journal-title":"IEEE Trans. Inform. Theory"},{"key":"10.1016\/S0169-7161(82)02038-0_bib6","doi-asserted-by":"crossref","first-page":"227","DOI":"10.1016\/S0019-9958(78)90587-9","article-title":"f-entropies, probabilities of error and feature selection","volume":"39","author":"Ben-Bassat","year":"1978","journal-title":"Inform. and Control"},{"key":"10.1016\/S0169-7161(82)02038-0_bib7","doi-asserted-by":"crossref","first-page":"324","DOI":"10.1109\/TIT.1978.1055890","article-title":"Renyi's entropy and the probability of error","volume":"24","author":"Ben-Bassat","year":"1978","journal-title":"IEEE Trans. Inform. Theory"},{"key":"10.1016\/S0169-7161(82)02038-0_bib8","doi-asserted-by":"crossref","first-page":"57","DOI":"10.1109\/TPAMI.1980.4766970","article-title":"On the sensitivity of the probability of error rule for feature selection","volume":"2","author":"Ben-Bassat","year":"1980","journal-title":"IEEE Trans. Pattern Anal. Machine Intell."},{"key":"10.1016\/S0169-7161(82)02038-0_bib9","doi-asserted-by":"crossref","first-page":"1054","DOI":"10.1109\/T-C.1971.223402","article-title":"Theoretical comparison of a class of feature selection criteria in pattern recognition","volume":"20","author":"Chen","year":"1971","journal-title":"IEEE Trans. Comput."},{"key":"10.1016\/S0169-7161(82)02038-0_bib10","doi-asserted-by":"crossref","first-page":"159","DOI":"10.1016\/S0020-0255(76)90746-5","article-title":"On information and distance measures, error bounds and feature selection","volume":"10","author":"Chen","year":"1976","journal-title":"Inform. Sci."},{"key":"10.1016\/S0169-7161(82)02038-0_bib11","doi-asserted-by":"crossref","first-page":"116","DOI":"10.1109\/TSMC.1974.5408535","article-title":"The best two independent measurements are not the two best","volume":"4","author":"Cover","year":"1974","journal-title":"IEEE Trans. Systems Man Cybernet."},{"key":"10.1016\/S0169-7161(82)02038-0_bib12","doi-asserted-by":"crossref","first-page":"21","DOI":"10.1109\/TIT.1967.1053964","article-title":"Nearest neighbor pattern classification","volume":"13","author":"Cover","year":"1967","journal-title":"IEEE Trans. Inform. Theory"},{"key":"10.1016\/S0169-7161(82)02038-0_bib13","doi-asserted-by":"crossref","first-page":"657","DOI":"10.1109\/TSMC.1977.4309803","article-title":"On the possible orderings in the measurement selection problem","volume":"7","author":"Cover","year":"1977","journal-title":"IEEE Trans. Systems Man Cybernet."},{"key":"10.1016\/S0169-7161(82)02038-0_bib14","doi-asserted-by":"crossref","first-page":"36","DOI":"10.1016\/S0019-9958(70)80040-7","article-title":"Generalized information functions","volume":"16","author":"Daroczy","year":"1970","journal-title":"Inform. and Control"},{"key":"10.1016\/S0169-7161(82)02038-0_bib15","doi-asserted-by":"crossref","first-page":"404","DOI":"10.1214\/aoms\/1177704567","article-title":"Uncertainty, information and sequential experiments","volume":"33","author":"DeGroot","year":"1962","journal-title":"Ann. Math. Statist."},{"key":"10.1016\/S0169-7161(82)02038-0_bib16","series-title":"Optimal Statistical Decisions","author":"DeGroot","year":"1970"},{"key":"10.1016\/S0169-7161(82)02038-0_bib17","doi-asserted-by":"crossref","first-page":"70","DOI":"10.1109\/T-C.1974.223779","article-title":"On a class of bounds on Bayes risk in multihypothesis pattern recognition","volume":"23","author":"Devijver","year":"1973","journal-title":"IEEE Trans. Comput."},{"key":"10.1016\/S0169-7161(82)02038-0_bib18","doi-asserted-by":"crossref","first-page":"222","DOI":"10.1016\/S0019-9958(77)90294-7","article-title":"Entropies of degree \u03b2 and lower bounds for the average error rate","volume":"34","author":"Devijver","year":"1977","journal-title":"Inform. and Control"},{"key":"10.1016\/S0169-7161(82)02038-0_bib19","series-title":"Proc. Fourth Internat. Joint. Conf. Pattern Recognition","first-page":"217","article-title":"Nonparametric estimation by the method of ordered nearest neighbor sample sets","author":"Devijver","year":"1978"},{"key":"10.1016\/S0169-7161(82)02038-0_bib20","series-title":"Proc. Second Internat. Joint Conf. Pattern Recognition","first-page":"65","article-title":"Some methods for the selection of independent binary features","author":"Duin","year":"1974"},{"key":"10.1016\/S0169-7161(82)02038-0_bib21","doi-asserted-by":"crossref","first-page":"668","DOI":"10.1093\/biomet\/54.3-4.668","article-title":"On the choice of variables in classification problems with dichotomous variables","volume":"54","author":"Elashoff","year":"1971","journal-title":"Biometrika"},{"key":"10.1016\/S0169-7161(82)02038-0_bib22","doi-asserted-by":"crossref","first-page":"33","DOI":"10.1109\/TSSC.1970.300326","article-title":"Feature selection in pattern recognition","volume":"6","author":"Fu","year":"1970","journal-title":"IEEE Trans. Systems Sci. Cybernet."},{"key":"10.1016\/S0169-7161(82)02038-0_bib23","series-title":"Introduction to Statistical Pattern Recognition","author":"Fukunaga","year":"1972"},{"key":"10.1016\/S0169-7161(82)02038-0_bib24","doi-asserted-by":"crossref","first-page":"373","DOI":"10.1007\/BF02479383","article-title":"Separation and probability of correct classification among two or more distributions","volume":"25","author":"Glick","year":"1973","journal-title":"Ann. Inst. Statist. Math."},{"key":"10.1016\/S0169-7161(82)02038-0_bib25","doi-asserted-by":"crossref","first-page":"176","DOI":"10.1055\/s-0038-1636670","article-title":"The diagnostic process with special reference to errors","volume":"10","author":"Good","year":"1971","journal-title":"Math. Inform. Med."},{"key":"10.1016\/S0169-7161(82)02038-0_bib26","doi-asserted-by":"crossref","first-page":"265","DOI":"10.1109\/TIT.1963.1057849","article-title":"Signal selection in communication and radar systems","volume":"9","author":"Greetenberg","year":"1963","journal-title":"IEEE Trans. Inform. Theory"},{"key":"10.1016\/S0169-7161(82)02038-0_bib27","doi-asserted-by":"crossref","DOI":"10.1109\/TIT.1970.1054466","article-title":"Probability of error, equivocation and the Chernoff bound","volume":"16","author":"Hellman","year":"1970","journal-title":"IEEE Trans. Inform. Theory"},{"key":"10.1016\/S0169-7161(82)02038-0_bib28","doi-asserted-by":"crossref","first-page":"763","DOI":"10.1109\/TSMC.1976.4309450","article-title":"On an estimate of the Bhattacharyya distance","volume":"6","author":"Jain","year":"1976","journal-title":"IEEE Trans. Systems Man Cybernet."},{"key":"10.1016\/S0169-7161(82)02038-0_bib29","doi-asserted-by":"crossref","first-page":"52","DOI":"10.1109\/TCOM.1967.1089532","article-title":"The divergence and Bhattacharyya distance in signal selection","volume":"15","author":"Kailath","year":"1967","journal-title":"IEEE Trans. Comm. Tech."},{"key":"10.1016\/S0169-7161(82)02038-0_bib30","doi-asserted-by":"crossref","first-page":"697","DOI":"10.1109\/TIT.1974.1055306","article-title":"Patterns in pattern recognition: 1968\u20131974","volume":"18","author":"Kanal","year":"1974","journal-title":"IEEE Trans. Inform. Theory"},{"key":"10.1016\/S0169-7161(82)02038-0_bib31","doi-asserted-by":"crossref","first-page":"236","DOI":"10.1016\/0047-259X(73)90026-2","article-title":"An axiomatic foundation for a multivariate measure of affinity among a number of distributions","volume":"3","author":"Kaufman","year":"1973","journal-title":"J. Multivariate Anal."},{"key":"10.1016\/S0169-7161(82)02038-0_bib32","doi-asserted-by":"crossref","first-page":"609","DOI":"10.1016\/S0020-7373(75)80023-X","article-title":"Mathematical methods of feature selection in pattern recognition","volume":"7","author":"Kittler","year":"1975","journal-title":"Internat. J. Man-Mach. Stud."},{"key":"10.1016\/S0169-7161(82)02038-0_bib33","doi-asserted-by":"crossref","first-page":"135","DOI":"10.1016\/0020-0190(75)90026-5","article-title":"On the divergence and Joshi dependence measure in feature selection","volume":"3","author":"Kittler","year":"1975","journal-title":"Information Processing Lett."},{"key":"10.1016\/S0169-7161(82)02038-0_bib34","series-title":"Character Readers and Pattern Recognition","article-title":"The problem of character recognition from the point of view of mathematical statistics","author":"Kovalevsky","year":"1968"},{"key":"10.1016\/S0169-7161(82)02038-0_bib35","doi-asserted-by":"crossref","first-page":"79","DOI":"10.1214\/aoms\/1177729694","article-title":"Information and sufficiency","volume":"22","author":"Kullback","year":"1951","journal-title":"Ann. Math. Statist"},{"key":"10.1016\/S0169-7161(82)02038-0_bib36","doi-asserted-by":"crossref","first-page":"730","DOI":"10.1109\/TIT.1969.1054374","article-title":"A class of upper bounds on probability of error for multihypothesis pattern recognition","volume":"15","author":"Lainiotis","year":"1969","journal-title":"IEEE Trans. Inform. Theory"},{"key":"10.1016\/S0169-7161(82)02038-0_bib37","doi-asserted-by":"crossref","first-page":"161","DOI":"10.1109\/TIT.1962.1057691","article-title":"The characteristic selection problem in recognition systems","volume":"8","author":"Lewis","year":"1962","journal-title":"IEEE Trans. Inform. Theory"},{"key":"10.1016\/S0169-7161(82)02038-0_bib38","doi-asserted-by":"crossref","first-page":"986","DOI":"10.1214\/aoms\/1177728069","article-title":"On a measure of the information provided by an experiment","volume":"27","author":"Lindley","year":"1956","journal-title":"Ann. Math. Statist."},{"key":"10.1016\/S0169-7161(82)02038-0_bib39","doi-asserted-by":"crossref","first-page":"34","DOI":"10.1109\/TIT.1976.1055512","article-title":"Error estimation in pattern recognition via L\u03b1-distance between posterior density functions","volume":"22","author":"Lissack","year":"1976","journal-title":"IEEE Trans. Inform. Theory"},{"key":"10.1016\/S0169-7161(82)02038-0_bib40","doi-asserted-by":"crossref","first-page":"11","DOI":"10.1109\/TIT.1963.1057810","article-title":"On the effectiveness of receptors in recognition systems","volume":"9","author":"Marill","year":"1963","journal-title":"IEEE Trans. Inform. Theory"},{"key":"10.1016\/S0169-7161(82)02038-0_bib41","series-title":"Basic Concepts in information Theory and Statistics","author":"Mathai","year":"1975"},{"key":"10.1016\/S0169-7161(82)02038-0_bib42","doi-asserted-by":"crossref","first-page":"181","DOI":"10.1007\/BF02911675","article-title":"On the notion of affinity of several distributions and some of its applications","volume":"19","author":"Matusita","year":"1967","journal-title":"Ann. Inst. Statist. Math."},{"key":"10.1016\/S0169-7161(82)02038-0_bib43","series-title":"Discriminant Analysis and Applications","first-page":"213","article-title":"Discrimination and the affinity of distributions","author":"Matusita","year":"1973"},{"key":"10.1016\/S0169-7161(82)02038-0_bib44","doi-asserted-by":"crossref","first-page":"1023","DOI":"10.1109\/T-C.1971.223398","article-title":"A comparison of seven techniques for choosing subsets of pattern recognition properties","volume":"20","author":"Mucciardi","year":"1971","journal-title":"IEEE Trans. Comput."},{"key":"10.1016\/S0169-7161(82)02038-0_bib45","doi-asserted-by":"crossref","first-page":"917","DOI":"10.1109\/TC.1977.1674939","article-title":"A branch and bound algorithm for feature subset selection","volume":"26","author":"Narendra","year":"1977","journal-title":"IEEE Trans. Comput."},{"key":"10.1016\/S0169-7161(82)02038-0_bib46","doi-asserted-by":"crossref","first-page":"441","DOI":"10.1007\/BF02024507","article-title":"On measures of dependence","volume":"10","author":"Renyi","year":"1959","journal-title":"Acta Math. Acad. Sci. Hungar."},{"key":"10.1016\/S0169-7161(82)02038-0_bib47","first-page":"547","article-title":"On measures of entropy and information","volume":"1","author":"Renyi","year":"1960"},{"key":"10.1016\/S0169-7161(82)02038-0_bib48","first-page":"617","article-title":"On the amount of information concerning an unknown parameter in a sequence of observations","volume":"9","author":"Renyi","year":"1964","journal-title":"Publ. Math. Inst. Hungar. Acad. Sci."},{"key":"10.1016\/S0169-7161(82)02038-0_bib49","series-title":"Research Papers in Statistics","first-page":"281","article-title":"On the amount of missing information and Neyman-Pearson lemma","author":"Renyi","year":"1966"},{"key":"10.1016\/S0169-7161(82)02038-0_bib50","series-title":"Proc. Fifth Berkeley Symposium on Math. Statist","first-page":"531","article-title":"On some problems of statistics from the point of view of information theory","author":"Renyi","year":"1967"},{"key":"10.1016\/S0169-7161(82)02038-0_bib51","first-page":"249","article-title":"Statistics and information theory","volume":"2","author":"Renyi","year":"1967","journal-title":"Studia Sci. Math. Hungar."},{"key":"10.1016\/S0169-7161(82)02038-0_bib52","series-title":"Probability Theory","author":"Renyi","year":"1970"},{"key":"10.1016\/S0169-7161(82)02038-0_bib53","doi-asserted-by":"crossref","first-page":"379","DOI":"10.1002\/j.1538-7305.1948.tb01338.x","article-title":"A mathematical theory of communication","volume":"7","author":"Shannon","year":"1948","journal-title":"Bell Systems Tech. J."},{"key":"10.1016\/S0169-7161(82)02038-0_bib54","doi-asserted-by":"crossref","first-page":"1157","DOI":"10.1214\/aoms\/1177703273","article-title":"On a measure of association","volume":"35","author":"Silvey","year":"1964","journal-title":"Ann. Math. Stat."},{"key":"10.1016\/S0169-7161(82)02038-0_bib55","series-title":"Proc. Third Internat. Joint Conf. Pattern Recognition","first-page":"245","article-title":"On selecting features for pattern recognition","author":"Stearns","year":"1976"},{"key":"10.1016\/S0169-7161(82)02038-0_bib56","doi-asserted-by":"crossref","first-page":"943","DOI":"10.1109\/T-C.1971.223380","article-title":"Some upper bounds on error probability for multiclass pattern recognition","volume":"20","author":"Toussaint","year":"1971","journal-title":"IEEE Trans. Comput."},{"key":"10.1016\/S0169-7161(82)02038-0_bib57","first-page":"618","article-title":"Note on the optimal selection of independent binary valued features for pattern recognition","volume":"17","author":"Toussaint","year":"1971","journal-title":"IEEE Trans. Comput."},{"key":"10.1016\/S0169-7161(82)02038-0_bib58","doi-asserted-by":"crossref","first-page":"153","DOI":"10.1016\/0020-0190(72)90049-X","article-title":"Feature evaluation with quadratic mutual information","volume":"1","author":"Toussaint","year":"1972","journal-title":"Information Processing Lett."},{"key":"10.1016\/S0169-7161(82)02038-0_bib59","series-title":"Proc. Second Internat. Joint Conf. Pattern Recognition","first-page":"479","article-title":"Recent progress in statistical methods applied to pattern recognition","author":"Toussaint","year":"1974"},{"key":"10.1016\/S0169-7161(82)02038-0_bib60","series-title":"Proc. Second Internat. Joint Conf. Pattern Recognition","article-title":"On the divergence between two distributions and the probability of misclassification of several decision rules","author":"Toussaint","year":"1974"},{"key":"10.1016\/S0169-7161(82)02038-0_bib61","series-title":"Proc. Symp. Statist., Related Topics","article-title":"On information transmission, nonparametric classification and measuring dependence between random variables","author":"Toussaint","year":"1974"},{"key":"10.1016\/S0169-7161(82)02038-0_bib62","first-page":"275","article-title":"An upper bound on the probability of misclassification in terms of the affinity","volume":"65","author":"Toussaint","year":"1977"},{"key":"10.1016\/S0169-7161(82)02038-0_bib63","doi-asserted-by":"crossref","first-page":"482","DOI":"10.1109\/TSMC.1978.4310001","article-title":"Probability of error, expected divergence and the affinity of several distributions","volume":"8","author":"Toussaint","year":"1978","journal-title":"IEEE Trans. Systems Man Cybernet."},{"key":"10.1016\/S0169-7161(82)02038-0_bib64","series-title":"Probability of error and equivocation of order \u03b1","author":"Toussaint","year":"1978"},{"key":"10.1016\/S0169-7161(82)02038-0_bib65","first-page":"9","article-title":"Bounds on the minimal error probability and checking a finite or countable number of hypotheses","volume":"4","author":"Vajda","year":"1968","journal-title":"Inform. Transmis. Problems"},{"key":"10.1016\/S0169-7161(82)02038-0_bib66","doi-asserted-by":"crossref","first-page":"381","DOI":"10.1109\/T-C.1973.223725","article-title":"Feature evaluation with measures of probabilistic dependence","volume":"22","author":"Vilmansen","year":"1973","journal-title":"IEEE Trans. Comput."}],"container-title":["Handbook of Statistics","Classification Pattern Recognition and Reduction of Dimensionality"],"original-title":[],"language":"en","deposited":{"date-parts":[[2024,12,31]],"date-time":"2024-12-31T19:31:44Z","timestamp":1735673504000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0169716182020380"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[1982]]},"ISBN":["9780444862174"],"references-count":66,"URL":"https:\/\/doi.org\/10.1016\/s0169-7161(82)02038-0","relation":{},"ISSN":["0169-7161"],"issn-type":[{"value":"0169-7161","type":"print"}],"subject":[],"published":{"date-parts":[[1982]]}}}