{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,17]],"date-time":"2026-01-17T03:34:31Z","timestamp":1768620871337,"version":"3.49.0"},"reference-count":40,"publisher":"Springer Science and Business Media LLC","issue":"1-2","license":[{"start":{"date-parts":[[2011,6,3]],"date-time":"2011-06-03T00:00:00Z","timestamp":1307059200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Mach Learn"],"published-print":{"date-parts":[[2011,10]]},"DOI":"10.1007\/s10994-011-5252-9","type":"journal-article","created":{"date-parts":[[2011,6,3]],"date-time":"2011-06-03T08:03:48Z","timestamp":1307088228000},"page":"77-108","source":"Crossref","is-referenced-by-count":52,"title":["SpicyMKL: a fast algorithm for Multiple Kernel Learning with thousands of kernels"],"prefix":"10.1007","volume":"85","author":[{"given":"Taiji","family":"Suzuki","sequence":"first","affiliation":[]},{"given":"Ryota","family":"Tomioka","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2011,6,3]]},"reference":[{"key":"5252_CR1","doi-asserted-by":"crossref","first-page":"337","DOI":"10.1090\/S0002-9947-1950-0051437-7","volume":"68","author":"N. Aronszajn","year":"1950","unstructured":"Aronszajn, N. (1950). Theory of reproducing kernels. Transactions of the American Mathematical Society, 68, 337\u2013404.","journal-title":"Transactions of the American Mathematical Society"},{"key":"5252_CR2","unstructured":"Asuncion, A., & Newman, D. (2007). UCI machine learning repository. http:\/\/www.ics.uci.edu\/~mlearn\/MLRepository.html ."},{"key":"5252_CR3","first-page":"1179","volume":"9","author":"F. R. Bach","year":"2008","unstructured":"Bach, F. R. (2008). Consistency of the group Lasso and multiple kernel learning. 
Journal of Machine Learning Research, 9, 1179\u20131225.","journal-title":"Journal of Machine Learning Research"},{"key":"5252_CR4","first-page":"41","volume-title":"Proceedings of the 21st international conference on machine learning","author":"F. R. Bach","year":"2004","unstructured":"Bach, F. R., Lanckriet, G., & Jordan, M. (2004). Multiple kernel learning, conic duality, and the SMO algorithm. In Proceedings of the 21st international conference on machine learning (pp. 41\u201348)."},{"key":"5252_CR5","first-page":"73","volume-title":"Advances in neural information processing systems","author":"F. R. Bach","year":"2005","unstructured":"Bach, F. R., Thibaux, R., & Jordan, M. I. (2005). Computing regularization paths for learning multiple kernels. In Advances in neural information processing systems (Vol. 17, pp. 73\u201380). Cambridge: MIT Press."},{"key":"5252_CR6","volume-title":"Constrained optimization and Lagrange multiplier methods","author":"D. P. Bertsekas","year":"1982","unstructured":"Bertsekas, D. P. (1982). Constrained optimization and Lagrange multiplier methods. New York: Academic Press."},{"key":"5252_CR7","volume-title":"Nonlinear programming","author":"D. P. Bertsekas","year":"1999","unstructured":"Bertsekas, D. P. (1999). Nonlinear programming. Nashua: Athena Scientific."},{"issue":"2","key":"5252_CR8","doi-asserted-by":"crossref","first-page":"489","DOI":"10.1109\/TIT.2005.862083","volume":"52","author":"E. J. Candes","year":"2006","unstructured":"Candes, E. J., Romberg, J., & Tao, T. (2006). Robust uncertainty principles: Exact signal reconstruction from highly incomplete frequency information. IEEE Transactions on Information Theory, 52(2), 489\u2013509.","journal-title":"IEEE Transactions on Information Theory"},{"key":"5252_CR9","volume-title":"NIPS workshop on kernel learning: automatic selection of optimal kernels","author":"O. Chapelle","year":"2008","unstructured":"Chapelle, O., & Rakotomamonjy, A. (2008). 
Second order optimization of kernel parameters. In NIPS workshop on kernel learning: automatic selection of optimal kernels, Whistler."},{"key":"5252_CR10","doi-asserted-by":"crossref","unstructured":"Cortes, C. (2009). Can learning kernels help performance? Invited talk at International Conference on Machine Learning (ICML 2009), Montr\u00e9al, Canada.","DOI":"10.1145\/1553374.1553538"},{"key":"5252_CR11","volume-title":"Proceedings of the 25th conference on uncertainty in artificial intelligence (UAI 2009)","author":"C. Cortes","year":"2009","unstructured":"Cortes, C., Mohri, M., & Rostamizadeh, A. (2009). L 2 regularization for learning kernels. In Proceedings of the 25th conference on uncertainty in artificial intelligence (UAI 2009), Montr\u00e9al, Canada."},{"key":"5252_CR12","doi-asserted-by":"crossref","first-page":"1413","DOI":"10.1002\/cpa.20042","volume":"LVII","author":"I. Daubechies","year":"2004","unstructured":"Daubechies, I., Defrise, M., & Mol, C. D. (2004). An iterative thresholding algorithm for linear inverse problems with a sparsity constraint. Communications on Pure and Applied Mathematics, LVII, 1413\u20131457.","journal-title":"Communications on Pure and Applied Mathematics"},{"key":"5252_CR13","doi-asserted-by":"crossref","first-page":"906","DOI":"10.1109\/TIP.2003.814255","volume":"12","author":"M. Figueiredo","year":"2003","unstructured":"Figueiredo, M., & Nowak, R. (2003). An EM algorithm for wavelet-based image restoration. IEEE Transactions on Image Processing, 12, 906\u2013916.","journal-title":"IEEE Transactions on Image Processing"},{"key":"5252_CR14","volume-title":"Proceedings of the IEEE computer society conference on computer vision and pattern (CVPR2009)","author":"P. V. Gehler","year":"2009","unstructured":"Gehler, P. V., & Nowozin, S. (2009). Let the kernel figure it out; principled learning of pre-processing for kernel classifiers. 
In Proceedings of the IEEE computer society conference on computer vision and pattern (CVPR2009)."},{"key":"5252_CR15","doi-asserted-by":"crossref","first-page":"303","DOI":"10.1007\/BF00927673","volume":"4","author":"M. Hestenes","year":"1969","unstructured":"Hestenes, M. (1969). Multiplier and gradient methods. Journal of Optimization Theory and Applications, 4, 303\u2013320.","journal-title":"Journal of Optimization Theory and Applications"},{"key":"5252_CR16","doi-asserted-by":"crossref","first-page":"82","DOI":"10.1016\/0022-247X(71)90184-3","volume":"33","author":"G. S. Kimeldorf","year":"1971","unstructured":"Kimeldorf, G. S., & Wahba, G. (1971). Some results on Tchebycheffian spline functions. Journal of Mathematical Analysis and Applications, 33, 82\u201395.","journal-title":"Journal of Mathematical Analysis and Applications"},{"key":"5252_CR17","first-page":"997","volume-title":"Advances in neural information processing systems","author":"M. Kloft","year":"2009","unstructured":"Kloft, M., Brefeld, U., Sonnenburg, S., Laskov, P., M\u00fcller, K. R., & Zien, A. (2009). Efficient and accurate \u2113 p -norm multiple kernel learning. In Y. Bengio, D. Schuurmans, J. Lafferty, C. K. I. Williams, & A.\u00a0Culotta (Eds.), Advances in neural information processing systems (Vol. 22, pp. 997\u20131005). Cambridge: MIT Press."},{"key":"5252_CR18","unstructured":"Kloft, M., R\u00fcckert, U., & Bartlett, P. L. (2010). A unifying view of multiple kernel learning. arXiv:1005.0437 ."},{"key":"5252_CR19","first-page":"27","volume":"5","author":"G. Lanckriet","year":"2004","unstructured":"Lanckriet, G., Cristianini, N., Ghaoui, L. E., Bartlett, P., & Jordan, M. (2004). Learning the kernel matrix with semi-definite programming. Journal of Machine Learning Research, 5, 27\u201372.","journal-title":"Journal of Machine Learning Research"},{"key":"5252_CR20","first-page":"1099","volume":"6","author":"C. A. Micchelli","year":"2005","unstructured":"Micchelli, C. A., & Pontil, M. 
(2005). Learning the kernel function via regularization. Journal of Machine Learning Research, 6, 1099\u20131125.","journal-title":"Journal of Machine Learning Research"},{"key":"5252_CR21","volume-title":"NIPS 2008 workshop: kernel learning: automatic selection of optimal kernels","author":"S. Mosci","year":"2008","unstructured":"Mosci, S., Santoro, M., Verri, A., & Villa, S. (2008). A new algorithm to learn an optimal kernel based on Fenchel duality. In NIPS 2008 workshop: kernel learning: automatic selection of optimal kernels, Whistler."},{"key":"5252_CR22","first-page":"844","volume-title":"Advances in neural information processing systems","author":"J. S. Nath","year":"2009","unstructured":"Nath, J. S., Dinesh, G., Raman, S., Bhattacharyya, C., Ben-Tal, A., & Ramakrishnan, K. R. (2009). On the algorithmics and applications of a mixed-norm based kernel learning formulation. In Advances in neural information processing systems (Vol.\u00a022, pp. 844\u2013852). Cambridge: MIT Press."},{"key":"5252_CR23","first-page":"1059","volume-title":"Advances in neural information processing systems","author":"J. Palmer","year":"2006","unstructured":"Palmer, J., Wipf, D., Kreutz-Delgado, K., & Rao, B. (2006). Variational EM algorithms for non-Gaussian latent variable models. In Y. Weiss, B. Sch\u00f6lkopf, & J. Platt (Eds.), Advances in neural information processing systems (Vol.\u00a018, pp. 1059\u20131066). Cambridge: MIT Press."},{"key":"5252_CR24","first-page":"557","volume-title":"Advances in neural information processing systems","author":"J. C. Platt","year":"1999","unstructured":"Platt, J. C. (1999). Using sparseness and analytic QP to speed training of support vector machines. In Advances in neural information processing systems (Vol. 11, pp. 557\u2013563). Cambridge: MIT Press."},{"key":"5252_CR25","first-page":"283","volume-title":"Optimization","author":"M. Powell","year":"1969","unstructured":"Powell, M. (1969). 
A method for nonlinear constraints in minimization problems. In R. Fletcher (Ed.), Optimization (pp. 283\u2013298). London: Academic Press."},{"key":"5252_CR26","first-page":"2491","volume":"9","author":"A. Rakotomamonjy","year":"2008","unstructured":"Rakotomamonjy, A., Bach, F., & Canu, S. Y. G. (2008). SimpleMKL. Journal of Machine Learning Research, 9, 2491\u20132521.","journal-title":"Journal of Machine Learning Research"},{"issue":"3","key":"5252_CR27","doi-asserted-by":"crossref","first-page":"287","DOI":"10.1023\/A:1007618119488","volume":"42","author":"G. R\u00e4tsch","year":"2001","unstructured":"R\u00e4tsch, G., Onoda, T., & M\u00fcller, K. R. (2001). Soft margins for adaboost. Machine Learning, 42(3), 287\u2013320.","journal-title":"Machine Learning"},{"key":"5252_CR28","doi-asserted-by":"crossref","DOI":"10.1515\/9781400873173","volume-title":"Convex analysis","author":"R. T. Rockafellar","year":"1970","unstructured":"Rockafellar, R. T. (1970). Convex analysis. Princeton: Princeton University Press."},{"key":"5252_CR29","doi-asserted-by":"crossref","first-page":"97","DOI":"10.1287\/moor.1.2.97","volume":"1","author":"R. T. Rockafellar","year":"1976","unstructured":"Rockafellar, R. T. (1976). Augmented Lagrangians and applications of the proximal point algorithm in convex programming. Mathematics of Operations Research, 1, 97\u2013116.","journal-title":"Mathematics of Operations Research"},{"key":"5252_CR30","volume-title":"Learning with kernels","author":"B. Sch\u00f6lkopf","year":"2002","unstructured":"Sch\u00f6lkopf, B., & Smola, A. J. (2002). Learning with kernels. Cambridge: MIT Press."},{"key":"5252_CR31","first-page":"1531","volume":"7","author":"S. Sonnenburg","year":"2006","unstructured":"Sonnenburg, S., R\u00e4tsch, G., Sch\u00e4fer, C., & Sch\u00f6lkopf, B. (2006). Large scale multiple kernel learning. 
Journal of Machine Learning Research, 7, 1531\u20131565.","journal-title":"Journal of Machine Learning Research"},{"issue":"12","key":"5252_CR32","doi-asserted-by":"crossref","first-page":"1067","DOI":"10.1109\/LSP.2009.2030111","volume":"16","author":"R. Tomioka","year":"2009","unstructured":"Tomioka, R., & Sugiyama, M. (2009). Dual augmented lagrangian method for efficient sparse reconstruction. IEEE Signal Processing Letters, 16(12), 1067\u20131070.","journal-title":"IEEE Signal Processing Letters"},{"key":"5252_CR33","unstructured":"Tomioka, R., & Suzuki, T. (2009). Sparsity-accuracy trade-off in MKL. arXiv:1001.2615 ."},{"key":"5252_CR34","unstructured":"Tomioka, R., & Suzuki, T. (2011). Regularization strategies and empirical Bayesian learning for MKL. arXiv:1011.3090 ."},{"key":"5252_CR35","first-page":"1501","volume":"12","author":"R. Tomioka","year":"2011","unstructured":"Tomioka, R., Suzuki, T., & Sugiyama, M. (2011). Super-linear convergence of dual augmented lagrangian algorithm for sparse learning. Journal of Machine Learning Research, 12, 1501\u20131550.","journal-title":"Journal of Machine Learning Research"},{"issue":"7","key":"5252_CR36","doi-asserted-by":"crossref","first-page":"2479","DOI":"10.1109\/TSP.2009.2016892","volume":"57","author":"S. J. Wright","year":"2009","unstructured":"Wright, S. J., Nowak, R. D., & Figueiredo, M. A. T. (2009). Sparse reconstruction by separable approximation. IEEE Transactions on Signal Processing, 57(7), 2479\u20132493. doi: 10.1109\/TSP.2009.2016892 .","journal-title":"IEEE Transactions on Signal Processing"},{"key":"5252_CR37","first-page":"1825","volume-title":"Advances in neural information processing systems","author":"Z. Xu","year":"2009","unstructured":"Xu, Z., Jin, R., King, I., & Lyu, M. R. (2009). An extended level method for efficient multiple kernel learning. In Advances in neural information processing systems (Vol.\u00a021, pp. 1825\u20131832). 
Cambridge: MIT Press."},{"issue":"1","key":"5252_CR38","doi-asserted-by":"crossref","first-page":"49","DOI":"10.1111\/j.1467-9868.2005.00532.x","volume":"68","author":"M. Yuan","year":"2006","unstructured":"Yuan, M., & Lin, Y. (2006). Model selection and estimation in regression with grouped variables. Journal of the Royal Statistical Society, Series B, 68(1), 49\u201367.","journal-title":"Journal of the Royal Statistical Society, Series B"},{"key":"5252_CR39","volume-title":"Nonlinear programming: a unified approach","author":"W. I. Zangwill","year":"1969","unstructured":"Zangwill, W. I. (1969). Nonlinear programming: a unified approach. New York: Prentice Hall."},{"key":"5252_CR40","first-page":"1191","volume-title":"Proceedings of the 24th international conference on machine learning","author":"A. Zien","year":"2007","unstructured":"Zien, A., & Ong, C. (2007). Multiclass multiple kernel learning. In Proceedings of the 24th international conference on machine learning (pp. 1191\u20131198). 
New York: ACM."}],"container-title":["Machine Learning"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10994-011-5252-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10994-011-5252-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10994-011-5252-9","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,6,11]],"date-time":"2019-06-11T10:47:54Z","timestamp":1560250074000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10994-011-5252-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2011,6,3]]},"references-count":40,"journal-issue":{"issue":"1-2","published-print":{"date-parts":[[2011,10]]}},"alternative-id":["5252"],"URL":"https:\/\/doi.org\/10.1007\/s10994-011-5252-9","relation":{},"ISSN":["0885-6125","1573-0565"],"issn-type":[{"value":"0885-6125","type":"print"},{"value":"1573-0565","type":"electronic"}],"subject":[],"published":{"date-parts":[[2011,6,3]]}}}