{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,29]],"date-time":"2025-09-29T07:47:48Z","timestamp":1759132068350,"version":"3.40.3"},"publisher-location":"Cham","reference-count":31,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319712482"},{"type":"electronic","value":"9783319712499"}],"license":[{"start":{"date-parts":[[2017,1,1]],"date-time":"2017-01-01T00:00:00Z","timestamp":1483228800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2017,1,1]],"date-time":"2017-01-01T00:00:00Z","timestamp":1483228800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017]]},"DOI":"10.1007\/978-3-319-71249-9_27","type":"book-chapter","created":{"date-parts":[[2017,12,29]],"date-time":"2017-12-29T08:53:43Z","timestamp":1514537623000},"page":"445-459","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Crossprop: Learning Representations by Stochastic Meta-Gradient Descent in Neural Networks"],"prefix":"10.1007","author":[{"given":"Vivek","family":"Veeriah","sequence":"first","affiliation":[]},{"given":"Shangtong","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Richard S.","family":"Sutton","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,12,30]]},"reference":[{"key":"27_CR1","unstructured":"Bahdanau, D., Cho, K., Bengio, Y.: Neural machine translation by jointly learning to align and translate (2014). arXiv preprint arXiv:1409.0473"},{"key":"27_CR2","doi-asserted-by":"crossref","first-page":"253","DOI":"10.1613\/jair.3912","volume":"47","author":"MG Bellemare","year":"2013","unstructured":"Bellemare, M.G., Naddaf, Y., Veness, J., Bowling, M.: The arcade learning environment: an evaluation platform for general agents. J. Artif. Intell. Res. (JAIR) 47, 253\u2013279 (2013)","journal-title":"J. Artif. Intell. Res. (JAIR)"},{"key":"27_CR3","doi-asserted-by":"crossref","unstructured":"Cho, K., Van Merrinboer, B., Gulcehre, C., Bahdanau, D., Bougares, F., Schwenk, H., Bengio, Y.: Learning phrase representations using RNN encoder-decoder for statistical machine translation (2014). arXiv preprint arXiv:1406.1078","DOI":"10.3115\/v1\/D14-1179"},{"key":"27_CR4","series-title":"LNCS","doi-asserted-by":"publisher","first-page":"561","DOI":"10.1007\/978-3-642-35289-8_30","volume-title":"Neural Networks: Tricks of the Trade","author":"A Coates","year":"2012","unstructured":"Coates, A., Ng, A.Y.: Learning feature representations with K-means. In: Montavon, G., Orr, G.B., M\u00fcller, K.-R. (eds.) Neural Networks: Tricks of the Trade. LNCS, vol. 7700, pp. 561\u2013580. Springer, Heidelberg (2012). https:\/\/doi.org\/10.1007\/978-3-642-35289-8_30"},{"issue":"3","key":"27_CR5","doi-asserted-by":"publisher","first-page":"287","DOI":"10.1016\/0165-1684(94)90029-9","volume":"36","author":"P Comon","year":"1994","unstructured":"Comon, P.: Independent component analysis, a new concept? Sig. process. 36(3), 287\u2013314 (1994)","journal-title":"Sig. process."},{"key":"27_CR6","doi-asserted-by":"crossref","unstructured":"Deng, J., Dong, W., Socher, R., Li, L.J., Li, K., Fei-Fei, L.: Imagenet: a large-scale hierarchical image database. In: 2009 IEEE Conference on Computer Vision and Pattern Recognition, CVPR 2009, pp. 248\u2013255. IEEE, June 2009","DOI":"10.1109\/CVPR.2009.5206848"},{"issue":"4","key":"27_CR7","doi-asserted-by":"publisher","first-page":"295","DOI":"10.1016\/0893-6080(88)90003-2","volume":"1","author":"RA Jacobs","year":"1988","unstructured":"Jacobs, R.A.: Increased rates of convergence through learning rate adaptation. Neural Netw. 1(4), 295\u2013307 (1988)","journal-title":"Neural Netw."},{"key":"27_CR8","unstructured":"Kingma, D., Ba, J.: Adam: a method for stochastic optimization (2014). arXiv preprint arXiv:1412.6980"},{"key":"27_CR9","doi-asserted-by":"crossref","unstructured":"Kirkpatrick, J., Pascanu, R., Rabinowitz, N., Veness, J., Desjardins, G., Rusu, A.A., Milan, K., Quan, J., Ramalho, T., Grabska-Barwinska, A., Hassabis, D.: Overcoming catastrophic forgetting in neural networks. Proc. Nat. Acad. Sci. 201611835 (2017)","DOI":"10.1073\/pnas.1611835114"},{"issue":"3","key":"27_CR10","doi-asserted-by":"publisher","first-page":"247","DOI":"10.1109\/TSSC.1969.300268","volume":"5","author":"A Klopf","year":"1969","unstructured":"Klopf, A., Gose, E.: An evolutionary pattern recognition network. IEEE Trans. Syst. Sci. Cybern. 5(3), 247\u2013250 (1969)","journal-title":"IEEE Trans. Syst. Sci. Cybern."},{"key":"27_CR11","unstructured":"LeCun, Y., Cortes, C., Burges., C.: The MNIST database of handwritten digits (1988)"},{"issue":"39","key":"27_CR12","first-page":"1","volume":"17","author":"S Levine","year":"2016","unstructured":"Levine, S., Finn, C., Darrell, T., Abbeel, P.: End-to-end training of deep visuomotor policies. J. Mach. Learn. Res. 17(39), 1\u201340 (2016)","journal-title":"J. Mach. Learn. Res."},{"issue":"Nov","key":"27_CR13","first-page":"2579","volume":"9","author":"LVD Maaten","year":"2008","unstructured":"Maaten, L.V.D., Hinton, G.: Visualizing data using t-SNE. J. Mach. Learn. Res. 9(Nov), 2579\u20132605 (2008)","journal-title":"J. Mach. Learn. Res."},{"key":"27_CR14","unstructured":"Mahmood, A.R., Sutton, R.S.: Representation search through generate and test. In: AAAI Workshop, Learning Rich Representations from Low-Level Sensors, June 2013"},{"key":"27_CR15","doi-asserted-by":"crossref","unstructured":"Miotto, R., Li, L., Kidd, B.A., Dudley, J.T.: Deep patient: an unsupervised representation to predict the future of patients from the electronic health records. Scientific reports 6, 26094 (2016)","DOI":"10.1038\/srep26094"},{"issue":"7540","key":"27_CR16","doi-asserted-by":"publisher","first-page":"529","DOI":"10.1038\/nature14236","volume":"518","author":"V Mnih","year":"2015","unstructured":"Mnih, V., Kavukcuoglu, K., Silver, D., Rusu, A.A., Veness, J., Bellemare, M.G., Graves, A., Riedmiller, M., Fidjeland, A.K., Ostrovski, G., Petersen, S.: Human-level control through deep reinforcement learning. Nature 518(7540), 529\u2013533 (2015)","journal-title":"Nature"},{"key":"27_CR17","doi-asserted-by":"crossref","unstructured":"Morav\u010d\u00edk, M., Schmid, M., Burch, N., Lis, V., Morrill, D., Bard, N., Davis, T., Waugh, K., Johanson, M., Bowling, M.: Deepstack: Expert-level artificial intelligence in no-limit poker (2017). arXiv preprint arXiv:1701.01724","DOI":"10.1126\/science.aam6960"},{"issue":"23","key":"27_CR18","doi-asserted-by":"publisher","first-page":"3311","DOI":"10.1016\/S0042-6989(97)00169-7","volume":"37","author":"BA Olshausen","year":"1997","unstructured":"Olshausen, B.A., Field, D.J.: Sparse coding with an overcomplete basis set: a strategy employed by V1? Vis. Res. 37(23), 3311\u20133325 (1997)","journal-title":"Vis. Res."},{"key":"27_CR19","doi-asserted-by":"crossref","unstructured":"Papernot, N., McDaniel, P., Jha, S., Fredrikson, M., Celik, Z.B., Swami, A.: The limitations of deep learning in adversarial settings. In: 2016 IEEE European Symposium on Security and Privacy (EuroS&P), pp. 372\u2013387. IEEE, March 2016","DOI":"10.1109\/EuroSP.2016.36"},{"key":"27_CR20","doi-asserted-by":"crossref","unstructured":"Ring, M.B.: CHILD: a first step towards continual learning. Mach. Learn. 28(1), 77\u2013104 (1997)","DOI":"10.1023\/A:1007331723572"},{"issue":"3","key":"27_CR21","first-page":"1","volume":"5","author":"DE Rumelhart","year":"1988","unstructured":"Rumelhart, D.E., Hinton, G.E., Williams, R.J.: Learning representations by back-propagating errors. Cogn. Model. 5(3), 1 (1988)","journal-title":"Cogn. Model."},{"key":"27_CR22","doi-asserted-by":"crossref","unstructured":"Schraudolph, N.N.: Local gain adaptation in stochastic gradient descent (1999)","DOI":"10.1049\/cp:19991170"},{"issue":"1","key":"27_CR23","doi-asserted-by":"publisher","first-page":"94","DOI":"10.1109\/TPAMI.2014.2343229","volume":"37","author":"A Sironi","year":"2015","unstructured":"Sironi, A., Tekin, B., Rigamonti, R., Lepetit, V., Fua, P.: Learning separable filters. IEEE Trans. Pattern Anal. Mach. Intell. 37(1), 94\u2013106 (2015)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"27_CR24","unstructured":"Sutton, R.S.: Two problems with backpropagation and other steepest-descent learning procedures for networks. In: Proceeding of 8th Annual Conference on Cognitive Science Society, pp. 823\u2013831. Erlbaum, May 1986"},{"key":"27_CR25","unstructured":"Sutton, R.S.: Adapting bias by gradient descent: an incremental version of delta-bar-delta. In: AAAI, pp. 171\u2013176, July 1992"},{"key":"27_CR26","unstructured":"Sutton, R.S.: Myths of representation learning. In: ICLR (2014). Lecture"},{"key":"27_CR27","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Ioffe, S., Vanhoucke, V., Alemi, A.A.: Inception-v4, inception-ResNet and the impact of residual connections on learning. In: AAAI, pp. 4278\u20134284 (2017)","DOI":"10.1609\/aaai.v31i1.11231"},{"issue":"2","key":"27_CR28","first-page":"26","volume":"4","author":"T Tieleman","year":"2012","unstructured":"Tieleman, T., Hinton, G.: Lecture 6.5-rmsprop: divide the gradient by a running average of its recent magnitude. COURSERA: Neural Netw. Mach. Learn. 4(2), 26\u201331 (2012)","journal-title":"Mach. Learn."},{"issue":"Dec","key":"27_CR29","first-page":"3371","volume":"11","author":"P Vincent","year":"2010","unstructured":"Vincent, P., Larochelle, H., Lajoie, I., Bengio, Y., Manzagol, P.A.: Stacked denoising autoencoders: learning useful representations in a deep network with a local denoising criterion. J. Mach. Learn. Res. 11(Dec), 3371\u20133408 (2010)","journal-title":"J. Mach. Learn. Res."},{"key":"27_CR30","unstructured":"Wu, Y., Schuster, M., Chen, Z., Le, Q.V., Norouzi, M., Macherey, W., ... Klingner, J.: Google\u2019s neural machine translation system: bridging the gap between human and machine translation (2016). arXiv preprint arXiv:1609.08144"},{"key":"27_CR31","unstructured":"Zeiler, M.D.: ADADELTA: an adaptive learning rate method (2012). arXiv preprint arXiv:1212.5701"}],"container-title":["Lecture Notes in Computer Science","Machine Learning and Knowledge Discovery in Databases"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-71249-9_27","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,12,29]],"date-time":"2022-12-29T01:29:25Z","timestamp":1672277365000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-319-71249-9_27"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017]]},"ISBN":["9783319712482","9783319712499"],"references-count":31,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-71249-9_27","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2017]]},"assertion":[{"value":"30 December 2017","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECML PKDD","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Joint European Conference on Machine Learning and Knowledge Discovery in Databases","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Skopje","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Macedonia","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2017","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18 September 2017","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"22 September 2017","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"ecml2017","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/ecmlpkdd2017.ijs.si\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}