{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,26]],"date-time":"2025-03-26T02:07:56Z","timestamp":1742954876906,"version":"3.40.3"},"publisher-location":"Cham","reference-count":7,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319314464"},{"type":"electronic","value":"9783319314471"}],"license":[{"start":{"date-parts":[[2016,1,1]],"date-time":"2016-01-01T00:00:00Z","timestamp":1451606400000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016]]},"DOI":"10.1007\/978-3-319-31447-1_11","type":"book-chapter","created":{"date-parts":[[2016,3,14]],"date-time":"2016-03-14T01:10:30Z","timestamp":1457917830000},"page":"159-172","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Optimality and Equilibrium of Exploration Ratio for Multiagent Learning in Nonstationary Environments"],"prefix":"10.1007","author":[{"given":"Itsuki","family":"Noda","sequence":"first","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2016,3,15]]},"reference":[{"key":"11_CR1","unstructured":"Kaisers, M., Tuyls, K.: Frequency adjusted multi-agent q-learning. In: Proceedings of 9th International Conference on Autonomous Agents and Multiagent Systems (AAMAS 2010), pp. 309\u2013315, May 2010"},{"key":"11_CR2","doi-asserted-by":"crossref","unstructured":"Noda, I.: Limitations of simultaneous multiagent learning in nonstationary environments. In: Proceedings of 2013 IEEE\/WIC\/ACM International Conference on Intelligent Agent Technology (IAT 2013), pp. 309\u2013314. IEEE, November 2013","DOI":"10.1109\/WI-IAT.2013.125"},{"key":"11_CR3","unstructured":"Noda, I.: Robustness of optimality of exploration ratio against agent population in multiagent learning for nonstationary environments. In: Multiagent Interaction Without Prior Coordination (Technical report WS-14-09), pp. 28\u201334. AAAI, July 2014"},{"key":"11_CR4","volume-title":"Reinforcement Learning: An Introduction","author":"RS Sutton","year":"1998","unstructured":"Sutton, R.S., Barto, A.G.: Reinforcement Learning: An Introduction. MIT Press, Cambridge (1998)"},{"key":"11_CR5","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"203","DOI":"10.1007\/978-3-642-16111-7_23","volume-title":"KI 2010: Advances in Artificial Intelligence","author":"M Tokic","year":"2010","unstructured":"Tokic, M.: Adaptive \n                      \n                        \n                      \n                      $$\\epsilon $$\n                      \n                        \n                          \u03f5\n                        \n                      \n                    -greedy exploration in reinforcement learning based on value differences. In: Dillmann, R., Beyerer, J., Hanebeck, U.D., Schultz, T. (eds.) KI 2010. LNCS, vol. 6359, pp. 203\u2013210. Springer, Heidelberg (2010)"},{"key":"11_CR6","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"335","DOI":"10.1007\/978-3-642-24455-1_33","volume-title":"KI 2011: Advances in Artificial Intelligence","author":"M Tokic","year":"2011","unstructured":"Tokic, M., Palm, G.: Value-difference based exploration: adaptive control between epsilon-greedy and softmax. In: Bach, J., Edelkamp, S. (eds.) KI 2011. LNCS, vol. 7006, pp. 335\u2013346. Springer, Heidelberg (2011)"},{"key":"11_CR7","unstructured":"Wunder, M., Littman, M.L., Babes, M.: Classes of multiagent q-learning dynamicswith epsilon-greedy exploration. In: Frnkranz, J., Joachims, T. (eds.) Proceedings of the 27th International Conference on Machine Learning (ICML 2010), pp. 1167\u20131174. Omnipress (2010). \n                      http:\/\/www.icml2010.org\/papers\/191.pdf"}],"container-title":["Lecture Notes in Computer Science","Multi-Agent Based Simulation XVI"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-31447-1_11","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,6,1]],"date-time":"2019-06-01T14:47:44Z","timestamp":1559400464000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-31447-1_11"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016]]},"ISBN":["9783319314464","9783319314471"],"references-count":7,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-31447-1_11","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2016]]},"assertion":[{"value":"15 March 2016","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}