{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,13]],"date-time":"2025-10-13T19:30:46Z","timestamp":1760383846408,"version":"3.41.2"},"reference-count":40,"publisher":"Springer Science and Business Media LLC","issue":"1-3","license":[{"start":{"date-parts":[[2002,7,1]],"date-time":"2002-07-01T00:00:00Z","timestamp":1025481600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2002,7,1]],"date-time":"2002-07-01T00:00:00Z","timestamp":1025481600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Machine Learning"],"published-print":{"date-parts":[[2002,7]]},"DOI":"10.1023\/a:1013947519741","type":"journal-article","created":{"date-parts":[[2002,12,28]],"date-time":"2002-12-28T13:55:48Z","timestamp":1041083748000},"page":"51-84","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":17,"title":["Metric-Based Methods for Adaptive Model Selection and Regularization"],"prefix":"10.1007","volume":"48","author":[{"given":"Dale","family":"Schuurmans","sequence":"first","affiliation":[]},{"given":"Finnegan","family":"Southey","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"393391_CR1","doi-asserted-by":"crossref","first-page":"203","DOI":"10.1007\/BF02506337","volume":"22","author":"H. Akaike","year":"1970","unstructured":"Akaike, H. (1970). Statistical predictor information. Annals of the Institute of Statistical Mathematics, 22, 203\u2013271.","journal-title":"Annals of the Institute of Statistical Mathematics"},{"key":"393391_CR2","doi-asserted-by":"crossref","first-page":"716","DOI":"10.1109\/TAC.1974.1100705","volume":"19","author":"H. Akaike","year":"1974","unstructured":"Akaike, H. (1974). A new look at the statistical model identification. IEEE Transactions on Automatic Control, 19, 716\u2013723.","journal-title":"IEEE Transactions on Automatic Control"},{"key":"393391_CR3","doi-asserted-by":"crossref","DOI":"10.1017\/CBO9780511624216","volume-title":"Neural network learning: Theoretical foundations","author":"M. Anthony","year":"1999","unstructured":"Anthony, M., & Bartlett, P. (1999). Neural network learning: Theoretical foundations. Cambridge: Cambridge University Press."},{"key":"393391_CR4","doi-asserted-by":"crossref","DOI":"10.1093\/oso\/9780198538493.001.0001","volume-title":"Neural networks for pattern recognition","author":"C. Bishop","year":"1995","unstructured":"Bishop, C. (1995). Neural networks for pattern recognition. Oxford: Clarendon Press."},{"key":"393391_CR5","first-page":"92","volume":"COLT-98","author":"A. Blum","year":"1998","unstructured":"Blum, A., & Mitchell, T. (1998). Combining labeled and unlabeled data with co-training. In Proceedings Annual Conference on Computational Learning Theory, COLT-98 (pp. 92\u2013100).","journal-title":"Proceedings Annual Conference on Computational Learning Theory"},{"key":"393391_CR6","doi-asserted-by":"crossref","first-page":"123","DOI":"10.1023\/A:1018054314350","volume":"24","author":"L. Breiman","year":"1996","unstructured":"Breiman, L. (1996). Bagging predictors. Machine Learning, 24, 123\u2013140.","journal-title":"Machine Learning"},{"issue":"6","key":"393391_CR7","doi-asserted-by":"crossref","first-page":"2102","DOI":"10.1109\/18.556600","volume":"42","author":"V. Castelli","year":"1996","unstructured":"Castelli, V., & Cover, T. (1996). The relative value of labeled and unlabeled samples in pattern recognition with an unknown mixing parameter. IEEE Transactions on Information Theory, 42:6, 2102\u20132117.","journal-title":"IEEE Transactions on Information Theory"},{"key":"393391_CR8","volume-title":"Learning from data: Concepts, theory, and methods","author":"V. Cherkassky","year":"1998","unstructured":"Cherkassky, V., & Mulier, F. (1998). Learning from data: Concepts, theory, and methods. New York: Wiley."},{"unstructured":"Cherkassky, V., Mulier, F., & Vapnik, V. (1997). Comparison of VC-method with classical methods for model selection. In Proceedings World Congress on Neural Networks (pp. 957-962).","key":"393391_CR9"},{"key":"393391_CR10","volume-title":"Elements of information theory","author":"T. Cover","year":"1991","unstructured":"Cover, T., & Thomas, J. (1991). Elements of information theory. New York: Wiley."},{"key":"393391_CR11","doi-asserted-by":"crossref","first-page":"377","DOI":"10.1007\/BF01404567","volume":"31","author":"P. Craven","year":"1979","unstructured":"Craven, P., & Wahba, G. (1979). Smoothing noisy data with spline functions. Numerische Mathematik, 31, 377\u2013403.","journal-title":"Numerische Mathematik"},{"key":"393391_CR12","doi-asserted-by":"crossref","first-page":"460","DOI":"10.1137\/1021092","volume":"21","author":"B. Efron","year":"1979","unstructured":"Efron, B. (1979). Computers and the theory of statistics: Thinking the unthinkable. SIAM Review, 21, 460\u2013480.","journal-title":"SIAM Review"},{"key":"393391_CR13","doi-asserted-by":"crossref","first-page":"1947","DOI":"10.1214\/aos\/1176325766","volume":"22","author":"D. Foster","year":"1994","unstructured":"Foster, D., & George, E. (1994). The risk inflation criterion for multiple regression. Annals of Statistics, 22, 1947\u20131975.","journal-title":"Annals of Statistics"},{"issue":"1","key":"393391_CR14","doi-asserted-by":"crossref","first-page":"119","DOI":"10.1006\/jcss.1997.1504","volume":"55","author":"Y. Freund","year":"1997","unstructured":"Freund, Y., & Schapire, R. (1997). A decision-theoretic generalization of on-line learning and an application to boosting. Journal of Computer and System Sciences, 55:1, 119\u2013139.","journal-title":"Journal of Computer and System Sciences"},{"unstructured":"Galarza, C., Rietman, E., & Vapnik, V. (1996). Applications of model selection techniques to polynomial approximation. Preprint.","key":"393391_CR15"},{"issue":"6","key":"393391_CR16","doi-asserted-by":"crossref","first-page":"552","DOI":"10.1109\/34.87342","volume":"13","author":"D. Gutfinger","year":"1991","unstructured":"Gutfinger, D., & Sklansky, J. (1991). Robust classifiers by mixed adaptation. IEEE Transactions onPattern Analysis and Machine Intelligence, 13:6, 552\u2013567.","journal-title":"IEEE Transactions onPattern Analysis and Machine Intelligence"},{"unstructured":"Heckerman, D., & Chickering, D. (1996). A comparison of scientific and engineering criteria for Bayesian model selection. Technical Report MSR-TR-96-12, Microsoft Research.","key":"393391_CR17"},{"unstructured":"Kohavi, R. (1995). A study of cross-validation and bootstrap for accuracy estimation and model selection. In Proceedings of International Joint Conference on Artificial Intelligence, IJCAI-95.","key":"393391_CR18"},{"key":"393391_CR19","first-page":"231","volume":"7","author":"A. Krogh","year":"1995","unstructured":"Krogh, A., & Vedelsby, J. (1995). Neural network ensembles, cross validation, and active learning. In Advances in neural information processing systems 7 (pp. 231\u2013238).","journal-title":"Advances in neural information processing systems"},{"key":"393391_CR20","doi-asserted-by":"crossref","first-page":"51","DOI":"10.1145\/238061.238068","volume":"COLT-96","author":"G. Lugosi","year":"1996","unstructured":"Lugosi, G., & Pinter, M. (1996). A data-dependent skeleton estimate for learning. In Proceedings Annual Conference on Computational Learning Theory, COLT-96 (pp. 51\u201356).","journal-title":"Proceedings Annual Conference on Computational Learning Theory"},{"key":"393391_CR21","doi-asserted-by":"crossref","first-page":"415","DOI":"10.1162\/neco.1992.4.3.415","volume":"4","author":"D. MacKay","year":"1992","unstructured":"MacKay, D. (1992). Bayesian interpolation. Neural Computation, 4, 415\u2013447.","journal-title":"Neural Computation"},{"key":"393391_CR22","first-page":"661","volume":"15","author":"C. Mallows","year":"1973","unstructured":"Mallows, C. (1973). Some comments on Cp. Technometrics, 15, 661\u2013676.","journal-title":"Technometrics"},{"key":"393391_CR23","first-page":"571","volume":"9","author":"D. Miller","year":"1997","unstructured":"Miller, D., & Uyar, H. (1997). A mixture of experts classifier with learning based on both labelled and unlabelled data. In Advances in neural information processing systems 9 (pp. 571\u2013577).","journal-title":"Advances in neural information processing systems"},{"issue":"364","key":"393391_CR24","doi-asserted-by":"crossref","first-page":"821","DOI":"10.1080\/01621459.1978.10480106","volume":"73","author":"T. O'Neill","year":"1978","unstructured":"O'Neill, T. (1978). Normal discrimination with unclassified observations. Journal of the American Statistical Association, 73:364, 821\u2013826.","journal-title":"Journal of the American Statistical Association"},{"doi-asserted-by":"crossref","unstructured":"Opitz, D., & Shavlik, J. (1996). Generating accurate and diverse members of a neural-network ensemble. In Advances in neural information processing systems 8.","key":"393391_CR25","DOI":"10.1080\/095400996116802"},{"key":"393391_CR26","doi-asserted-by":"crossref","first-page":"978","DOI":"10.1126\/science.247.4945.978","volume":"247","author":"T. Poggio","year":"1990","unstructured":"Poggio, T., & Girosi, F. (1990). Regularization algorithms for learning that are equivalent to multilayer networks. Science, 247, 978\u2013982.","journal-title":"Science"},{"key":"393391_CR27","first-page":"412","volume":"COLT-95","author":"J. Ratsaby","year":"1995","unstructured":"Ratsaby, J., & Venkatesh, S. (1995). Learning from a mixture of labeled and unlabeled examples with parametric side information. In Proceedings of Annual Conference on Computational Learning Theory, COLT-95 (pp. 412\u2013417).","journal-title":"Proceedings of Annual Conference on Computational Learning Theory"},{"key":"393391_CR28","doi-asserted-by":"crossref","DOI":"10.1017\/CBO9780511812651","volume-title":"Pattern recognition and neural networks","author":"B. Ripley","year":"1996","unstructured":"Ripley, B. (1996). Pattern recognition and neural networks. Cambridge: Cambridge University Press."},{"key":"393391_CR29","doi-asserted-by":"crossref","first-page":"1080","DOI":"10.1214\/aos\/1176350051","volume":"14","author":"J. Rissanen","year":"1986","unstructured":"Rissanen, J. (1986). Stochastic complexity and modeling. Annals of Statistics, 14, 1080\u20131100.","journal-title":"Annals of Statistics"},{"issue":"2","key":"393391_CR30","first-page":"153","volume":"10","author":"C. Schaffer","year":"1993","unstructured":"Schaffer, C. (1993). Overfitting avoidance as bias. Machine Learning, 10:2, 153\u2013178.","journal-title":"Machine Learning"},{"key":"393391_CR31","first-page":"683","volume":"ICML-94","author":"C. Schaffer","year":"1994","unstructured":"Schaffer,C. (1994).A conservation lawfor generalization performance. In Proceedings of International Conference on Machine Learning, ICML-94 (pp. 683\u2013690).","journal-title":"Proceedings of International Conference on Machine Learning"},{"key":"393391_CR32","first-page":"552","volume":"AAAI-97","author":"D. Schuurmans","year":"1997","unstructured":"Schuurmans, D. (1997). A new metric-based approach to model selection. In Proceedings of National Conference on Artificial Intelligence, AAAI-97 (pp. 552\u2013558).","journal-title":"Proceedings of National Conference on Artificial Intelligence"},{"key":"393391_CR33","first-page":"847","volume":"ICML-2000","author":"D. Schuurmans","year":"2000","unstructured":"Schuurmans, D., & Southey, F. (2000). An adaptive regularization criterion for supervised learning. In Proceedings of International Conference on Machine Learning, ICML-2000 (pp. 847\u2013854).","journal-title":"Proceedings of International Conference on Machine Learning"},{"key":"393391_CR34","first-page":"340","volume":"ICML-97","author":"D. Schuurmans","year":"1997","unstructured":"Schuurmans, D., Ungar, L., & Foster, D. (1997). Characterizing the generalization performance of model selection strategies. In Proceedings of International Conference on Machine Learning, ICML-97 (pp. 340\u2013348).","journal-title":"Proceedings of International Conference on Machine Learning"},{"key":"393391_CR35","doi-asserted-by":"crossref","first-page":"461","DOI":"10.1214\/aos\/1176344136","volume":"6","author":"G. Schwarz","year":"1978","unstructured":"Schwarz, G. (1978). Estimating the dimension of a model. Annals of Statistics, 6, 461\u2013464.","journal-title":"Annals of Statistics"},{"key":"393391_CR36","doi-asserted-by":"crossref","first-page":"45","DOI":"10.1093\/biomet\/68.1.45","volume":"68","author":"R. Shibata","year":"1981","unstructured":"Shibata, R. (1981). An optimal selection of regression variables. Biometrika, 68, 45\u201354.","journal-title":"Biometrika"},{"key":"393391_CR37","first-page":"647","volume":"8","author":"G. Towell","year":"1996","unstructured":"Towell, G. (1996). Using unlabeled data for supervised learning. In Advances in neural information processing systems 8 (pp. 647\u2013653).","journal-title":"Advances in neural information processing systems"},{"key":"393391_CR38","volume-title":"The nature of statistical learning theory","author":"V. Vapnik","year":"1996","unstructured":"Vapnik, V. (1996). The nature of statistical learning theory. New York: Springer-Verlag."},{"key":"393391_CR39","volume-title":"Computer systems that learn","author":"S. M. Weiss","year":"1991","unstructured":"Weiss, S. M., & Kulikowski, C. A. (1991). Computer systems that learn. San Mateo: Morgan Kaufmann."},{"issue":"2","key":"393391_CR40","doi-asserted-by":"crossref","first-page":"309","DOI":"10.1093\/biomet\/64.2.309","volume":"64","author":"A. Young","year":"1977","unstructured":"Young, A. (1977). A Bayesian approach to prediction using polynomials. Biometrika, 64:2, 309\u2013317.","journal-title":"Biometrika"}],"container-title":["Machine Learning"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1023\/A:1013947519741.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1023\/A:1013947519741\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1023\/A:1013947519741.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,10]],"date-time":"2025-07-10T11:37:18Z","timestamp":1752147438000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1023\/A:1013947519741"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2002,7]]},"references-count":40,"journal-issue":{"issue":"1-3","published-print":{"date-parts":[[2002,7]]}},"alternative-id":["393391"],"URL":"https:\/\/doi.org\/10.1023\/a:1013947519741","relation":{},"ISSN":["0885-6125","1573-0565"],"issn-type":[{"type":"print","value":"0885-6125"},{"type":"electronic","value":"1573-0565"}],"subject":[],"published":{"date-parts":[[2002,7]]},"assertion":[{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}