{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,15]],"date-time":"2024-09-15T14:37:15Z","timestamp":1726411035979},"publisher-location":"Singapore","reference-count":12,"publisher":"Springer Singapore","isbn-type":[{"type":"print","value":"9789811310553"},{"type":"electronic","value":"9789811310560"}],"license":[{"start":{"date-parts":[[2018,7,24]],"date-time":"2018-07-24T00:00:00Z","timestamp":1532390400000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019]]},"DOI":"10.1007\/978-981-13-1056-0_63","type":"book-chapter","created":{"date-parts":[[2018,7,23]],"date-time":"2018-07-23T12:30:31Z","timestamp":1532349031000},"page":"643-651","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["A Hybrid Deep Q-Network for the SVM Lagrangian"],"prefix":"10.1007","author":[{"given":"Chayoung","family":"Kim","sequence":"first","affiliation":[]},{"given":"Hye-young","family":"Kim","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,7,24]]},"reference":[{"key":"63_CR1","doi-asserted-by":"publisher","first-page":"389","DOI":"10.1023\/A:1012487302797","volume":"46","author":"I Guyon","year":"2002","unstructured":"Guyon I, Weston J, Barnhill S, Vapnik V (2002) Gene selection for cancer classification using support vector machine. Mach Learn 46:389\u2013422","journal-title":"Mach Learn"},{"key":"63_CR2","doi-asserted-by":"crossref","unstructured":"Chao C-F, Horng M-H (2015) The construction of support vector machine classifier using the firefly algorithm. Comput Intell Neurosci Arch 2015(2)","DOI":"10.1155\/2015\/212719"},{"issue":"1","key":"63_CR3","first-page":"9","volume":"3","author":"RS Sutton","year":"1988","unstructured":"Sutton RS (1988) Learning to predict by the methods of temporal differences. Mach Learn 3(1):9\u201344","journal-title":"Mach Learn"},{"key":"63_CR4","unstructured":"Sutton RS, Barto AG (1998) Reinforcement learning: an introduction, vol 1. MIT press Cambridge"},{"key":"63_CR5","unstructured":"Sutton RS, McAllester DA, Singh SP, Mansour Y (1999) Policy gradient methods for reinforcement learning with function approximation. In: NIPS, vol 99, pp 1057\u20131063 (1999)"},{"key":"63_CR6","unstructured":"Sutton RS (1984) Temporal credit assignment in reinforcement learning. Doctoral Dissertation"},{"key":"63_CR7","unstructured":"Tieleman T, Hinton G (2012) Lecture 6.5-rmsprop: divide the gradient by a running average of its recent magnitude. COURSERA: Neural Netw Mach Learn 4(2)"},{"key":"63_CR8","unstructured":"Silver D, Lever G, Heess N (2014) Deterministic policy gradient algorithms. In: ICML\u201914 proceedings of the 31st international conference on international conference on machine learning vol 32, pp 387\u2013395"},{"issue":"7587","key":"63_CR9","doi-asserted-by":"publisher","first-page":"484","DOI":"10.1038\/nature16961","volume":"529","author":"David Silver","year":"2016","unstructured":"Silver D, Huang A, Maddison CJ, Guez A, Sifre L, Driessche GVD, Schrittwieser J, Antonoglou I, Panneershelvam V, Lanctot M (2016) Mastering the game of go with deep neural networks and tree search. Nature, 529(7587):484\u2013489","journal-title":"Nature"},{"key":"63_CR10","unstructured":"Mnih V, Kavukcuoglu K, Silver D, Graves A, Antonoglou I, Wierstra D, Riedmiller M (2013) Playing atari with deep reinforcement learning. In: NIPS"},{"key":"63_CR11","unstructured":"Hansen S (2016) Using deep q-learning to control optimization hyperparameters. ArXiv"},{"key":"63_CR12","doi-asserted-by":"crossref","unstructured":"Tavallaee M, Bagheri E, Lu W, Ghorbani AA (2009) A detailed analysis of the KDD CUP 99 dataset. In: Proceedings of the 2009 IEEE symposium on computational intelligence in security and defense applications (CISDA 2009), pp 53\u201358","DOI":"10.1109\/CISDA.2009.5356528"}],"container-title":["Lecture Notes in Electrical Engineering","Information Science and Applications 2018"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-13-1056-0_63","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,10,21]],"date-time":"2019-10-21T01:17:12Z","timestamp":1571620632000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-981-13-1056-0_63"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,7,24]]},"ISBN":["9789811310553","9789811310560"],"references-count":12,"URL":"https:\/\/doi.org\/10.1007\/978-981-13-1056-0_63","relation":{},"ISSN":["1876-1100","1876-1119"],"issn-type":[{"type":"print","value":"1876-1100"},{"type":"electronic","value":"1876-1119"}],"subject":[],"published":{"date-parts":[[2018,7,24]]}}}