{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,9]],"date-time":"2024-09-09T14:08:25Z","timestamp":1725890905504},"publisher-location":"Berlin, Heidelberg","reference-count":38,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540653110"},{"type":"electronic","value":"9783540494300"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[1998]]},"DOI":"10.1007\/3-540-49430-8_9","type":"book-chapter","created":{"date-parts":[[2007,8,11]],"date-time":"2007-08-11T14:57:33Z","timestamp":1186844253000},"page":"165-191","source":"Crossref","is-referenced-by-count":17,"title":["A Dozen Tricks with Multitask Learning"],"prefix":"10.1007","author":[{"given":"Rich","family":"Caruana","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2002,3,28]]},"reference":[{"issue":"2","key":"9_CR1","doi-asserted-by":"publisher","first-page":"192","DOI":"10.1016\/0885-064X(90)90006-Y","volume":"6","author":"Y. S. Abu-Mostafa","year":"1990","unstructured":"Y. S. Abu-Mostafa, \u201cLearning from Hints in Neural Networks,\u201d Journal of Complexity, 1990, 6(2), pp. 192\u2013198.","journal-title":"Journal of Complexity"},{"key":"9_CR2","doi-asserted-by":"publisher","first-page":"639","DOI":"10.1162\/neco.1995.7.4.639","volume":"7","author":"Y. S. Abu-Mostafa","year":"1995","unstructured":"Y. S. Abu-Mostafa, \u201cHints,\u201d Neural Computation, 1995, 7, pp. 639\u2013671.","journal-title":"Neural Computation"},{"key":"9_CR3","doi-asserted-by":"crossref","unstructured":"J. Baxter, \u201cLearning Internal Representations,\u201d COLT-95, Santa Cruz, CA, 1995.","DOI":"10.1145\/225298.225336"},{"key":"9_CR4","unstructured":"J. Baxter, \u201cLearning Internal Representations,\u201d Ph.D. Thesis, The Flinders Univeristy of South Australia, Dec. 1994."},{"key":"9_CR5","first-page":"41","volume-title":"Proceedings of the 10th International Conference on Machine Learning","author":"R. Caruana","year":"1993","unstructured":"R. Caruana, \u201cMultitask Learning: A Knowledge-Based Source of Inductive Bias,\u201d Proceedings of the 10th International Conference on Machine Learning, ML-93, University of Massachusetts, Amherst, 1993, pp. 41\u201348."},{"key":"9_CR6","unstructured":"R. Caruana, \u201cMultitask Connectionist Learning,\u201d Proceedings of the 1993 Connectionist Models Summer School, 1994, pp. 372\u2013379."},{"key":"9_CR7","doi-asserted-by":"crossref","unstructured":"R. Caruana and D. Freitag, \u201cGreedy Attribute Selection,\u201d ICML-94, 1994, Rutgers, NJ, pp. 28\u201336.","DOI":"10.1016\/B978-1-55860-335-6.50012-X"},{"key":"9_CR8","unstructured":"R. Caruana, \u201cLearning Many Related Tasks at the Same Time with Backpropagation,\u201d NIPS-94, 1995, pp. 656\u2013664."},{"key":"9_CR9","first-page":"959","volume":"8","author":"R. Caruana","year":"1996","unstructured":"R. Caruana, S. Baluja, and T. Mitchell, \u201cUsing the Future to \u201cSort Out\u201d the Present: Rankprop and Multitask Learning for Medical Risk Prediction,\u201d Advances in Neural Information Processing Systems 8, (Proceedings of NIPS-95), 1996, pp. 959\u2013965.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"9_CR10","unstructured":"R. Caruana, and V. R. de Sa, \u201cPromoting Poor Features to Supervisors: Some Inputs Work Better As Outputs,\u201d NIPS-96, 1997."},{"key":"9_CR11","doi-asserted-by":"publisher","first-page":"41","DOI":"10.1023\/A:1007379606734","volume":"28","author":"R. Caruana","year":"1997","unstructured":"R. Caruana, \u201cMultitask Learning,\u201d Machine Learning, 28, pp. 41\u201375, 1997.","journal-title":"Machine Learning"},{"key":"9_CR12","unstructured":"R. Caruana, \u201cMultitask Learning,\u201d Ph.D. thesis, Carnegie Mellon University, CMU-CS-97-203, 1997."},{"key":"9_CR13","unstructured":"R. Caruana and J. O\u2019Sullivan, \u201cMultitask Pattern Recognition for Autonomous Robots,\u201d to appear in The Proceedings of the IEEE Intelligent Robots and Systems Conference, (IROS\u201998), Victoria, 1998."},{"key":"9_CR14","doi-asserted-by":"crossref","unstructured":"R. Caruana and V. R. de Sa, \u201cUsing Feature Selection to Find Inputs that Work Better as Outputs,\u201d to appear in The Proceedings of the International Conference on Neural Nets, (ICANN\u201998), Sweden, 1998.","DOI":"10.1007\/978-1-4471-1599-1_43"},{"key":"9_CR15","doi-asserted-by":"crossref","unstructured":"G. F. Cooper, C. F. Aliferis, R. Ambrosino, J. Aronis, B. G. Buchanan, R. Caruana, M. J. Fine, C. Glymour, G. Gordon, B. H. Hanusa, J. E. Janosky, C. Meek, T. Mitchell, T. Richardson, and P. Spirtes, \u201cAn Evaluation of Machine Learning Methods for Predicting Pneumonia Mortality,\u201d Artificial Intelligence in Medicine 9, 1997, pp. 107\u2013138.","DOI":"10.1016\/S0933-3657(96)00367-3"},{"key":"9_CR16","first-page":"37","volume-title":"Proceedings of the 11th International Conference on Machine Learning","author":"M. Craven","year":"1994","unstructured":"M. Craven and J. Shavlik, \u201cUsing Sampling and Queries to Extract Rules from Trained Neural Networks,\u201d Proceedings of the 11th International Conference on Machine Learning, ML-94, Rutgers University, New Jersey, 1994, pp. 37\u201345."},{"key":"9_CR17","doi-asserted-by":"crossref","unstructured":"I. Davis and A. Stentz, \u201cSensor Fusion for Autonomous Outdoor Navigation Using Neural Networks,\u201d Proceedings of IEEE\u2019s Intelligent Robots and Systems Conference, 1995.","DOI":"10.21236\/ADA293563"},{"key":"9_CR18","doi-asserted-by":"crossref","first-page":"263","DOI":"10.1613\/jair.105","volume":"2","author":"T. G. Dietterich","year":"1995","unstructured":"T. G. Dietterich and G. Bakiri, \u201cSolving Multiclass Learning Problems via Error-Correcting Output Codes,\u201d Journal of Artificial Intelligence Research, 1995, 2, pp. 263\u2013286.","journal-title":"Journal of Artificial Intelligence Research"},{"key":"9_CR19","doi-asserted-by":"crossref","unstructured":"M. J. Fine, D. Singer, B. H. Hanusa, J. Lave, and W. Kapoor, \u201cValidation of a Pneumonia Prognostic Index Using the MedisGroups Comparative Hospital Database,\u201d American Journal of Medicine, 1993.","DOI":"10.1016\/0002-9343(93)90177-Q"},{"key":"9_CR20","unstructured":"Ghosn, J. and Bengio, Y., \u201cMulti-Task Learning for Stock Selection,\u201d NIPS-96, 1997."},{"key":"9_CR21","unstructured":"T. Heskes, \u201cSolving a Huge Number of Similar Tasks: A Combination of Multitask Learning and a Hierarchical Bayesian Approach,\u201d Proceedings of the 15th International Conference on Machine Learning, Madison, Wisconsin, pp. 233\u2013241, 1998."},{"issue":"1","key":"9_CR22","doi-asserted-by":"publisher","first-page":"24","DOI":"10.1109\/72.105415","volume":"3","author":"L. Holmstrom","year":"1992","unstructured":"L. Holmstrom and P. Koistinen, \u201cUsing Additive Noise in Back-propagation Training,\u201d IEEE Transactions on Neural Networks, 1992, 3(1), pp. 24\u201338.","journal-title":"IEEE Transactions on Neural Networks"},{"key":"9_CR23","doi-asserted-by":"crossref","unstructured":"G. John, R. Kohavi, and K. Pfleger, \u201cIrrelevant Features and the Subset Selection Problem,\u201d ICML-94, 1994, Rutgers, NJ, pp. 121\u2013129.","DOI":"10.1016\/B978-1-55860-335-6.50023-4"},{"key":"9_CR24","unstructured":"D. Koller and M. Sahami, \u201cTowards Optimal Feature Selection,\u201d ICML-96, Bari, Italy, 1996, pp. 284\u2013292."},{"key":"9_CR25","doi-asserted-by":"publisher","first-page":"541","DOI":"10.1162\/neco.1989.1.4.541","volume":"1","author":"Y. Cun Le","year":"1989","unstructured":"Y. Le Cun, B. Boser, J. S. Denker, D. Henderson, R. E. Howard, W. Hubbard, and L. D. Jackal, \u201cBackpropagation Applied to Handwritten Zip-Code Recognition,\u201d Neural Computation, 1989, 1, pp. 541\u2013551.","journal-title":"Neural Computation"},{"key":"9_CR26","unstructured":"Y. Le Cun, private communication, 1997."},{"key":"9_CR27","unstructured":"P. W. Munro and B. Parmanto, \u201cCompetition Among Networks Improves Committee Performance,\u201d to appear in Advances in Neural Information Processing Systems 9, (Proceedings of NIPS-96), 1997."},{"key":"9_CR28","doi-asserted-by":"crossref","unstructured":"D. A. Pomerleau, \u201cNeural Network Perception for Mobile Robot Guidance,\u201d Doctoral Thesis, Carnegie Mellon University: CMU-CS-92-115, 1992.","DOI":"10.1007\/978-1-4615-3192-0"},{"key":"9_CR29","unstructured":"L. Y. Pratt, J. Mostow, and C. A. Kamm, \u201cDirect Transfer of Learned Information Among Neural Networks,\u201d Proceedings of AAAI-91, 1991."},{"key":"9_CR30","unstructured":"T. J. Sejnowski and C. R. Rosenberg, \u201cNETtalk: A Parallel Network that Learns to Read Aloud,\u201d John Hopkins: JHU\/EECS-86\/01, 1986."},{"key":"9_CR31","unstructured":"J. Sill and Y. Abu-Mostafa, \u201cMonotonicity Hints,\u201d to appear in Neural Information Processing Systems 9, (Proceedings of NIPS-96), 1997."},{"issue":"3","key":"9_CR32","doi-asserted-by":"publisher","first-page":"291","DOI":"10.1016\/S0020-7373(05)80130-0","volume":"35","author":"S. C. Suddarth","year":"1991","unstructured":"S. C. Suddarth and A. D. C. Holden, \u201cSymbolic-neural Systems and the Use of Hints for Developing Complex Systems,\u201d International Journal of Man-Machine Studies, 1991, 35(3), pp. 291\u2013311.","journal-title":"International Journal of Man-Machine Studies"},{"key":"9_CR33","doi-asserted-by":"crossref","unstructured":"S. C. Suddarth and Y. L. Kergosien, \u201cRule-injection Hints as a Means of Improving Network Performance and Learning Time,\u201d Proceedings of EURASIP Workshop on Neural Nets, 1990, pp. 120\u2013129.","DOI":"10.1007\/3-540-52255-7_33"},{"key":"9_CR34","doi-asserted-by":"crossref","unstructured":"S. Thrun, Explanation-Based Neural Network Learning: A Lifelong Learning Approach, 1996, Kluwer Academic Publisher.","DOI":"10.1007\/978-1-4613-1381-6"},{"key":"9_CR35","unstructured":"S. Thrun and L. Pratt, editors, Machine Learning. Second Special Issue on Inductive Transfer, 1997."},{"key":"9_CR36","doi-asserted-by":"crossref","unstructured":"S. Thrun and L. Pratt, editors, Learning to Learn, Kluwer, 1997.","DOI":"10.1007\/978-1-4615-5529-2"},{"key":"9_CR37","first-page":"326","volume-title":"Proceedings of the 11th International Conference on Machine Learning","author":"R. Valdes-Perez","year":"1994","unstructured":"R. Valdes-Perez and H. A. Simon, \u201cA Powerful Heuristic for the Discovery of Complex Patterned Behavior,\u201d Proceedings of the 11th International Conference on Machine Learning, ML-94, Rutgers University, New Jersey, 1994, pp. 326\u2013334."},{"key":"9_CR38","unstructured":"A. Weigend, D. Rumelhart, and B. Huberman, \u201cGeneralization by Weight-Elimination with Application to Forecasting,\u201d Advances in Neural Information Processing Systems 3, (Proceedings of NIPS-90), 1991, pp. 875\u2013882."}],"container-title":["Lecture Notes in Computer Science","Neural Networks: Tricks of the Trade"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/3-540-49430-8_9","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,1]],"date-time":"2019-05-01T23:30:15Z","timestamp":1556753415000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/3-540-49430-8_9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[1998]]},"ISBN":["9783540653110","9783540494300"],"references-count":38,"URL":"https:\/\/doi.org\/10.1007\/3-540-49430-8_9","relation":{},"ISSN":["0302-9743"],"issn-type":[{"type":"print","value":"0302-9743"}],"subject":[],"published":{"date-parts":[[1998]]}}}