{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,21]],"date-time":"2026-01-21T15:56:21Z","timestamp":1769010981759,"version":"3.49.0"},"reference-count":196,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"5","license":[{"start":{"date-parts":[[2015,5,1]],"date-time":"2015-05-01T00:00:00Z","timestamp":1430438400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"}],"funder":[{"name":"Stanford Graduate Fellowships"},{"name":"NSF Center for Science of Information","award":["CCF-0939370"],"award-info":[{"award-number":["CCF-0939370"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Inform. Theory"],"published-print":{"date-parts":[[2015,5]]},"DOI":"10.1109\/tit.2015.2412945","type":"journal-article","created":{"date-parts":[[2015,3,13]],"date-time":"2015-03-13T19:16:04Z","timestamp":1426274164000},"page":"2835-2885","source":"Crossref","is-referenced-by-count":136,"title":["Minimax Estimation of Functionals of Discrete Distributions"],"prefix":"10.1109","volume":"61","author":[{"family":"Jiantao Jiao","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kartik","family":"Venkat","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"family":"Yanjun Han","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tsachy","family":"Weissman","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref170","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4614-6660-4"},{"key":"ref172","first-page":"225","article-title":"Aggregation and minimax optimality in high-dimensional estimation","author":"tsybakov","year":"2014","journal-title":"Proc Int Congr Math"},{"key":"ref171","doi-asserted-by":"publisher","DOI":"10.1080\/03610928708829512"},{"key":"ref174","author":"lindvall","year":"2002","journal-title":"Lectures on the Coupling Method"},{"key":"ref173","author":"tsybakov","year":"2008","journal-title":"Introduction to Nonparametric Estimation"},{"key":"ref176","doi-asserted-by":"publisher","DOI":"10.1093\/acprof:oso\/9780199535255.001.0001"},{"key":"ref175","doi-asserted-by":"publisher","DOI":"10.1093\/biomet\/40.3-4.237"},{"key":"ref178","doi-asserted-by":"publisher","DOI":"10.1214\/aop\/1176991794"},{"key":"ref177","article-title":"Beyond maximum likelihood: From theory to practice","author":"jiao","year":"2014"},{"key":"ref168","doi-asserted-by":"publisher","DOI":"10.1090\/S0002-9947-1963-0157165-0"},{"key":"ref169","volume":"232","author":"totik","year":"2013","journal-title":"Polynomial Approximation on Polytopes"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1214\/aos\/1176350051"},{"key":"ref38","first-page":"707","article-title":"The asymptotic minimax risk for the estimation of constrained binomial and multinomial probabilities","volume":"66","author":"braess","year":"2004","journal-title":"Sankhya Indian J Stat"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4612-2618-5_1"},{"key":"ref32","first-page":"638","article-title":"New tricks for old dogs: Large alphabet probability estimation","author":"santhanam","year":"2007","journal-title":"Proc IEEE Inf Theory Workshop (ITW)"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.2307\/2290733"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.2307\/2335721"},{"key":"ref37","author":"chentsov","year":"1982","journal-title":"Statistical Decision Rules and Optimal Inference"},{"key":"ref36","doi-asserted-by":"crossref","DOI":"10.1109\/ISIT.2015.7282680","article-title":"Adaptive estimation of Shannon entropy","author":"han","year":"2015"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1214\/11-STS355"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1080\/01621459.2000.10474329"},{"key":"ref181","article-title":"Structure learning of probabilistic graphical models: A comprehensive survey","author":"zhou","year":"2011"},{"key":"ref180","doi-asserted-by":"publisher","DOI":"10.1214\/aop\/1176988736"},{"key":"ref185","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.1973.1055013"},{"key":"ref184","doi-asserted-by":"publisher","DOI":"10.1155\/2007\/79879"},{"key":"ref183","author":"koller","year":"2009","journal-title":"Probabilistic Graphical Models Principles and Techniques"},{"key":"ref182","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1561\/2200000001","article-title":"Graphical models, exponential families, and variational inference","volume":"1","author":"wainwright","year":"2008","journal-title":"Found Trends Mach Learn"},{"key":"ref189","article-title":"Collected works","volume":"2","author":"bernstein","year":"1964","journal-title":"Izd Akad Nauk SSSR"},{"key":"ref188","doi-asserted-by":"crossref","first-page":"1564","DOI":"10.1214\/aos\/1017939142","article-title":"Information-theoretic determination of minimax rates of convergence","volume":"27","author":"yang","year":"1999","journal-title":"Ann Statist"},{"key":"ref187","doi-asserted-by":"publisher","DOI":"10.1007\/BF01199026"},{"key":"ref186","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2011.2104513"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2004.833360"},{"key":"ref27","article-title":"Minimax rates of entropy estimation on large alphabets via best polynomial approximation","author":"wu","year":"2014"},{"key":"ref179","article-title":"Minimax estimation of discrete distributions under $\\ell _{1}$ loss","author":"han","year":"0"},{"key":"ref29","article-title":"Maximum likelihood estimation of functionals of discrete distributions","author":"jiao","year":"2015"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1016\/j.sigpro.2012.09.003"},{"key":"ref22","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4612-4946-7","author":"le cam","year":"1986","journal-title":"Asymptotic Methods in Statistical Decision Theory"},{"key":"ref21","author":"wald","year":"1950","journal-title":"Statistical Decision Functions"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/1993636.1993727"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511813603"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/FOCS.2011.81"},{"key":"ref25","first-page":"2157","article-title":"Estimating the unseen: Improved estimators for entropy and other properties","author":"valiant","year":"2013","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref50","first-page":"175","article-title":"Local asymptotic minimax and admissibility in estimation","volume":"1","author":"h\u00e1jek","year":"1972","journal-title":"Proc 6th Berkeley Symp Math Statist Probab"},{"key":"ref51","article-title":"On the lower limits of entropy estimation","author":"wyner","year":"0","journal-title":"IEEE Trans Inf Theory"},{"key":"ref154","doi-asserted-by":"publisher","DOI":"10.1214\/aos\/1176345778"},{"key":"ref153","doi-asserted-by":"publisher","DOI":"10.2307\/2337118"},{"key":"ref156","doi-asserted-by":"publisher","DOI":"10.1214\/aoms\/1177731020"},{"key":"ref155","article-title":"Minimax estimation of divergence functions","author":"jiao","year":"0"},{"key":"ref150","article-title":"Maximum likelihood. An introduction","volume":"18","author":"le cam","year":"1979","journal-title":"Lectures Notes"},{"key":"ref152","first-page":"361","article-title":"Estimation with quadratic loss","volume":"1","author":"james","year":"1961","journal-title":"Proc 4th Berkeley Symp Math Statist Probab"},{"key":"ref151","first-page":"197","article-title":"Inadmissibility of the usual estimator for the mean of a multivariate normal distribution","volume":"1","author":"stein","year":"1956","journal-title":"Proc Berkeley Symp on Math Statist and Prob"},{"key":"ref146","doi-asserted-by":"publisher","DOI":"10.1017\/S0305004100009580"},{"key":"ref147","doi-asserted-by":"publisher","DOI":"10.1098\/rspa.1934.0050"},{"key":"ref148","doi-asserted-by":"publisher","DOI":"10.1214\/aos\/1176345003"},{"key":"ref149","doi-asserted-by":"publisher","DOI":"10.1214\/07-STS249"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.2307\/2334280"},{"key":"ref58","article-title":"Does Dirichlet prior smoothing solve the Shannon entropy estimation problem?","author":"han","year":"0"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1088\/0305-4470\/31\/11\/007"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevE.52.6841"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/ISIT.2013.6620615"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1063\/1.166191"},{"key":"ref53","first-page":"95","article-title":"Note on the bias of information estimates","volume":"2","author":"miller","year":"1955","journal-title":"Information Theory in Psychology II-B"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1162\/089976603321780272"},{"key":"ref40","first-page":"1033","article-title":"Variational minimax estimation of discrete distributions under KL Loss","author":"paninski","year":"2004","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref167","author":"bustamante","year":"2011","journal-title":"Algebraic Approximation A Guide to Past and Current Solutions"},{"key":"ref166","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4612-4778-4","author":"ditzian","year":"1987","journal-title":"Moduli of Smoothness"},{"key":"ref165","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9781107325791"},{"key":"ref164","first-page":"429","article-title":"Sur la valeur asymptotique de la meilleure approximation d&#x2019;une fonction ayant un point singulier r&#x00E9;el","volume":"10","author":"ibragimov","year":"1946","journal-title":"Izvestiya Rossiiskoi Akademii Nauk Seriya Matematicheskaya"},{"key":"ref163","first-page":"169","article-title":"The best approximation of $|x|^{p}$ using polynomials of very high degree","volume":"2","author":"bernstein","year":"1938","journal-title":"Bull Russian Acad Sci"},{"key":"ref162","author":"bernstein","year":"1937","journal-title":"Extreme Properties of Polynomials and Best Approximation of Continuous Functions of One Real Variable"},{"key":"ref161","doi-asserted-by":"publisher","DOI":"10.1007\/s10543-009-0240-1"},{"key":"ref160","author":"driscoll","year":"2014","journal-title":"Chebfun Guide"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ISIT.2014.6875283"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/18.370121"},{"key":"ref6","author":"breiman","year":"1984","journal-title":"Classification and Regression Trees"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ISIT.2014.6875284"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/2.36"},{"key":"ref159","first-page":"41","article-title":"Sur la d&#x00E9;termination des polyn&#x00F4;mes d&#x2019;approximation de degr&#x00E9; donn&#x00E9;e","volume":"10","author":"remez","year":"1934","journal-title":"Commun Soc Math Kharkov"},{"key":"ref7","volume":"31","author":"lehmann","year":"1998","journal-title":"Theory of Point Estimation"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1007\/BF00533669"},{"key":"ref157","first-page":"303","article-title":"Unbiased estimates","volume":"14","author":"kolmogorov","year":"1950","journal-title":"Izvestiya Rossiiskoi Akademii Nauk Seriya Matematicheskaya"},{"key":"ref9","volume":"1","author":"quinlan","year":"1993","journal-title":"C4 5 Programs for Machine Learning"},{"key":"ref158","doi-asserted-by":"publisher","DOI":"10.1007\/978-94-011-1970-2"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/ISIT.2013.6620525"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2010.2043769"},{"key":"ref48","volume":"3","author":"van der vaart","year":"2000","journal-title":"Asymptotic Statistics"},{"key":"ref47","article-title":"The complexity of estimating R&#x00E9;nyi entropy","author":"acharya","year":"2014"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2012.2195769"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2004.834734"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevX.1.011008"},{"key":"ref43","doi-asserted-by":"crossref","first-page":"1018","DOI":"10.1126\/science.1177170","article-title":"Limits of predictability in human mobility","volume":"327","author":"song","year":"2010","journal-title":"Science"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-662-02888-9"},{"key":"ref72","doi-asserted-by":"crossref","DOI":"10.2307\/j.ctvc773pk","author":"p\u00f3lya","year":"2014","journal-title":"How to Solve It&#x2014;A New Aspect of Mathematical Method"},{"key":"ref71","article-title":"Algorithmic approaches to statistical questions","author":"valiant","year":"2012"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevE.85.051139"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1007\/s004409970006"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1214\/10-AOS849"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1137\/1131054"},{"key":"ref75","volume":"1738","author":"nemirovski","year":"2000","journal-title":"Topics in Non-Parametric Statistics"},{"key":"ref78","first-page":"1","article-title":"Strong uniqueness","volume":"5","author":"kro\u00f3","year":"2010","journal-title":"Surveys Approx Theory"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4899-0027-2"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1037\/h0026857"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.2307\/1936227"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1016\/0375-9601(88)90193-4"},{"key":"ref63","first-page":"1469","article-title":"Entropy inference and the James&#x2013;Stein estimator, with application to nonlinear gene association networks","volume":"10","author":"hausser","year":"2009","journal-title":"The Journal of Machine Learning Research archive"},{"key":"ref64","first-page":"471","article-title":"Entropy and inference, revisited","volume":"1","author":"nemenman","year":"2002","journal-title":"Advances in neural information processing systems"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1023\/A:1026096204727"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1186\/1471-2105-5-118"},{"key":"ref67","article-title":"Entropy estimates from insufficient samplings","author":"grassberger","year":"2008"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.3390\/e13122013"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevE.69.056111"},{"key":"ref193","doi-asserted-by":"publisher","DOI":"10.1016\/S0021-9800(69)80045-1"},{"key":"ref194","volume":"1","author":"bernstein","year":"1958","journal-title":"Collected Works Constructive Theory of Functions (1905&#x2013;1930)"},{"key":"ref195","first-page":"449","article-title":"Some coefficient estimates for polynomials on the unit interval","volume":"33","author":"qazi","year":"2007","journal-title":"Serdica Math J"},{"key":"ref196","doi-asserted-by":"publisher","DOI":"10.1214\/aoms\/1177732430"},{"key":"ref95","doi-asserted-by":"publisher","DOI":"10.3103\/S1066530712030027"},{"key":"ref94","doi-asserted-by":"publisher","DOI":"10.1214\/08-AOS654"},{"key":"ref190","doi-asserted-by":"publisher","DOI":"10.1007\/BF01890040"},{"key":"ref93","doi-asserted-by":"crossref","first-page":"341","DOI":"10.3150\/bj\/1116340298","article-title":"Adaptive estimation of linear functionals under different performance measures","volume":"11","author":"cai","year":"2005","journal-title":"Bernoulli"},{"key":"ref191","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511813603"},{"key":"ref92","doi-asserted-by":"publisher","DOI":"10.1214\/009053605000000633"},{"key":"ref192","year":"2013","journal-title":"Mathematica"},{"key":"ref91","doi-asserted-by":"crossref","first-page":"552","DOI":"10.1214\/009053604000000094","article-title":"Minimax estimation of linear functionals over nonconvex parameter spaces","volume":"32","author":"cai","year":"2004","journal-title":"Ann Statist"},{"key":"ref90","doi-asserted-by":"crossref","first-page":"1140","DOI":"10.1214\/aos\/1059655908","article-title":"A note on nonparametric estimation of linear functionals","volume":"31","author":"cai","year":"2003","journal-title":"Ann Statist"},{"key":"ref98","doi-asserted-by":"publisher","DOI":"10.1016\/0167-7152(87)90083-6"},{"key":"ref99","first-page":"381","article-title":"Estimating integrated squared density derivatives: Sharp best order of convergence estimates","volume":"50","author":"bickel","year":"1988","journal-title":"Sankhy? Indian J Statist Ser A (1961&#x2013;2002)"},{"key":"ref96","first-page":"65","article-title":"Asymptotically efficient estimation of nonlinear functionals","volume":"14","author":"levit","year":"1978","journal-title":"Problemy Peredachi Inf"},{"key":"ref97","first-page":"41","article-title":"On the nonparametric estimation of functionals","author":"ibragimov","year":"1978","journal-title":"Symp Asympt Statist"},{"key":"ref82","first-page":"738","article-title":"On efficiency of a class of non-parametric estimates","volume":"20","author":"levit","year":"1975","journal-title":"Teor Veroyatnost r Primenen"},{"key":"ref81","first-page":"215","article-title":"On optimality of some statistical estimates","volume":"2","author":"levit","year":"1974","journal-title":"Proc Prague Symp Asymptotic Statist"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1137\/1132002"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.1137\/1121087"},{"key":"ref80","doi-asserted-by":"crossref","first-page":"1769","DOI":"10.3982\/ECTA8681","article-title":"Impossibility results for nondifferentiable functionals","volume":"80","author":"hirano","year":"2012","journal-title":"Econometrica"},{"key":"ref89","doi-asserted-by":"crossref","first-page":"1567","DOI":"10.1214\/aos\/1015345955","article-title":"Sharp adaptive estimation of linear functionals","volume":"29","author":"klemel\u00e4","year":"2001","journal-title":"Ann Statist"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1214\/aos\/1176348114"},{"key":"ref86","doi-asserted-by":"publisher","DOI":"10.1214\/aos\/1176348115"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.1214\/aos\/1176325367"},{"key":"ref88","doi-asserted-by":"publisher","DOI":"10.1007\/s440-000-8013-3"},{"key":"ref101","doi-asserted-by":"publisher","DOI":"10.1214\/aos\/1176348249"},{"key":"ref100","doi-asserted-by":"publisher","DOI":"10.1016\/0885-064X(90)90025-9"},{"key":"ref127","doi-asserted-by":"publisher","DOI":"10.1109\/18.45281"},{"key":"ref126","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.1978.1055934"},{"key":"ref125","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.1977.1055714"},{"key":"ref124","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.1978.1055912"},{"key":"ref129","doi-asserted-by":"publisher","DOI":"10.1109\/ITW.2005.1531895"},{"key":"ref128","doi-asserted-by":"publisher","DOI":"10.1109\/18.669425"},{"key":"ref130","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2013.2267934"},{"key":"ref133","doi-asserted-by":"publisher","DOI":"10.1006\/jmva.1999.1873"},{"key":"ref134","author":"serdobolskii","year":"2007","journal-title":"Multiparametric Statistics"},{"key":"ref131","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2006.885507"},{"key":"ref132","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2006.871582"},{"key":"ref136","doi-asserted-by":"publisher","DOI":"10.1214\/12-AOS1054"},{"key":"ref135","doi-asserted-by":"publisher","DOI":"10.1214\/08-EJS262"},{"key":"ref138","doi-asserted-by":"publisher","DOI":"10.1145\/1968.1972"},{"key":"ref137","article-title":"Bernstein&#x2013;von Mises theorem for growing parameter dimension","author":"spokoiny","year":"2013"},{"key":"ref139","doi-asserted-by":"crossref","DOI":"10.1007\/0-387-34239-7","author":"vapnik","year":"2006","journal-title":"Estimation of Dependences Based on Empirical Data"},{"key":"ref140","volume":"2","author":"vapnik","year":"1998","journal-title":"Statistical Learning Theory"},{"key":"ref141","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2004.830761"},{"key":"ref142","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2011.2137210"},{"key":"ref143","doi-asserted-by":"publisher","DOI":"10.1109\/Allerton.2011.6120392"},{"key":"ref2","first-page":"547","article-title":"On measures of entropy and information","author":"r\u00e9nyi","year":"1961","journal-title":"Proc 4th Berkeley Symp Math Statist Probab"},{"key":"ref144","article-title":"Large alphabet compression and predictive distributions through poissonization and tilting","author":"yang","year":"2013"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1002\/j.1538-7305.1948.tb01338.x"},{"key":"ref145","doi-asserted-by":"publisher","DOI":"10.1098\/rsta.1922.0009"},{"key":"ref109","first-page":"75","article-title":"Root- $n$ consistent estimators of entropy for densities with unbounded support","volume":"23","author":"tsybakov","year":"1996","journal-title":"Scandinavian Journal of Statistics"},{"key":"ref108","doi-asserted-by":"publisher","DOI":"10.1007\/BF00773669"},{"key":"ref107","doi-asserted-by":"publisher","DOI":"10.1214\/009053606000000849"},{"key":"ref106","doi-asserted-by":"publisher","DOI":"10.1214\/009053605000000147"},{"key":"ref105","doi-asserted-by":"crossref","first-page":"1302","DOI":"10.1214\/aos\/1015957395","article-title":"Adaptive estimation of a quadratic functional by model selection","volume":"28","author":"laurent","year":"2000","journal-title":"Ann Statist"},{"key":"ref104","doi-asserted-by":"publisher","DOI":"10.1137\/1140012"},{"key":"ref103","doi-asserted-by":"publisher","DOI":"10.1214\/aos\/1176324452"},{"key":"ref102","doi-asserted-by":"crossref","first-page":"682","DOI":"10.1214\/aos\/1032894459","article-title":"On Bickel and Ritov&#x2019;s conjecture about adaptive estimation of the integral of the square of density derivative","volume":"24","author":"efromovich","year":"1996","journal-title":"Ann Statist"},{"key":"ref111","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2002.1028355"},{"key":"ref112","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevE.66.051903"},{"key":"ref110","first-page":"17","article-title":"Nonparametric entropy estimation: An overview","volume":"6","author":"beirlant","year":"1997","journal-title":"Int J Math Statist Sci"},{"key":"ref10","first-page":"297","article-title":"Improved information gain estimates for decision tree induction","author":"nowozin","year":"2012","journal-title":"Proc 29th Int Conf Mach Learn (ICML)"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.1968.1054142"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ISIT.2014.6874972"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1155\/2009\/308959"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TMI.2003.815867"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1023\/A:1007958904918"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/s00145-010-9084-8"},{"key":"ref118","first-page":"2537","article-title":"Exponential concentration for mutual information estimation with application to forests","author":"liu","year":"2012","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.2307\/1934352"},{"key":"ref117","doi-asserted-by":"publisher","DOI":"10.1214\/11-EJS614"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1088\/1751-8113\/41\/2\/025302"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-12465-5_10"},{"key":"ref119","doi-asserted-by":"publisher","DOI":"10.1002\/rsa.10019"},{"key":"ref114","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2008.928251"},{"key":"ref113","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevE.69.066138"},{"key":"ref116","doi-asserted-by":"crossref","first-page":"265","DOI":"10.1561\/0100000021","article-title":"Universal estimation of information measures for analog sources","volume":"5","author":"wang","year":"2009","journal-title":"Found Trends Commun Inf Theory"},{"key":"ref115","doi-asserted-by":"publisher","DOI":"10.3103\/S106653070803006X"},{"key":"ref120","doi-asserted-by":"publisher","DOI":"10.1002\/sim.2942"},{"key":"ref121","doi-asserted-by":"publisher","DOI":"10.1162\/NECO_a_00266"},{"key":"ref122","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2012.2217393"},{"key":"ref123","doi-asserted-by":"publisher","DOI":"10.1002\/j.1538-7305.1951.tb01366.x"}],"container-title":["IEEE Transactions on Information Theory"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/18\/7088688\/07060676.pdf?arnumber=7060676","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,2]],"date-time":"2022-05-02T16:17:53Z","timestamp":1651508273000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7060676\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,5]]},"references-count":196,"journal-issue":{"issue":"5"},"URL":"https:\/\/doi.org\/10.1109\/tit.2015.2412945","relation":{},"ISSN":["0018-9448","1557-9654"],"issn-type":[{"value":"0018-9448","type":"print"},{"value":"1557-9654","type":"electronic"}],"subject":[],"published":{"date-parts":[[2015,5]]}}}