{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,3]],"date-time":"2025-11-03T13:32:44Z","timestamp":1762176764168,"version":"3.40.3"},"publisher-location":"Berlin, Heidelberg","reference-count":23,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783662453902"},{"type":"electronic","value":"9783662453919"}],"license":[{"start":{"date-parts":[[2014,1,1]],"date-time":"2014-01-01T00:00:00Z","timestamp":1388534400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014]]},"DOI":"10.1007\/978-3-662-45391-9_11","type":"book-chapter","created":{"date-parts":[[2014,10,10]],"date-time":"2014-10-10T00:01:44Z","timestamp":1412899304000},"page":"154-168","source":"Crossref","is-referenced-by-count":26,"title":["Integrating On-policy Reinforcement Learning with Multi-agent Techniques for Adaptive Service Composition"],"prefix":"10.1007","author":[{"given":"Hongbing","family":"Wang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xin","family":"Chen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qin","family":"Wu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qi","family":"Yu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zibin","family":"Zheng","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Athman","family":"Bouguettaya","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"issue":"6","key":"11_CR1","doi-asserted-by":"publisher","first-page":"369","DOI":"10.1109\/TSE.2007.1011","volume":"33","author":"D. Ardagna","year":"2007","unstructured":"Ardagna, D., Pernici, B.: Adaptive service composition in flexible processes. IEEE Transactions on Software Engineering\u00a033(6), 369\u2013384 (2007)","journal-title":"IEEE Transactions on Software Engineering"},{"key":"11_CR2","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"530","DOI":"10.1007\/978-3-540-89652-4_42","volume-title":"Service-Oriented Computing \u2013 ICSOC 2008","author":"S. Beauche","year":"2008","unstructured":"Beauche, S., Poizat, P.: Automated service composition with adaptive planning. In: Bouguettaya, A., Krueger, I., Margaria, T. (eds.) ICSOC 2008. LNCS, vol.\u00a05364, pp. 530\u2013537. Springer, Heidelberg (2008)"},{"issue":"2","key":"11_CR3","doi-asserted-by":"publisher","first-page":"156","DOI":"10.1109\/TSMCC.2007.913919","volume":"38","author":"L. Busoniu","year":"2008","unstructured":"Busoniu, L., Babuska, R., De Schutter, B.: A comprehensive survey of multiagent reinforcement learning. IEEE Transactions on Systems, Man, and Cybernetics, Part C: Applications and Reviews\u00a038(2), 156\u2013172 (2008)","journal-title":"IEEE Transactions on Systems, Man, and Cybernetics, Part C: Applications and Reviews"},{"key":"11_CR4","unstructured":"Claus, C., Boutilier, C.: The dynamics of reinforcement learning in cooperative multiagent systems. In: AAAI\/IAAI, pp. 746\u2013752 (1998)"},{"key":"11_CR5","series-title":"CCIS","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/978-3-642-17625-8_1","volume-title":"Grid and Distributed Computing, Control and Automation","author":"J.O. Gutierrez-Garcia","year":"2010","unstructured":"Gutierrez-Garcia, J.O., Sim, K.-M.: Agent-based service composition in cloud computing. In: Kim, T.-h., Yau, S.S., Gervasi, O., Kang, B.-H., Stoica, A., \u015al\u0119zak, D. (eds.) GDC and CA 2010. CCIS, vol.\u00a0121, pp. 1\u201310. Springer, Heidelberg (2010)"},{"key":"11_CR6","unstructured":"Hu, J., Wellman, M.P.: Multiagent reinforcement learning: theoretical framework and an algorithm. In: ICML, vol.\u00a098, pp. 242\u2013250. Citeseer (1998)"},{"key":"11_CR7","doi-asserted-by":"crossref","unstructured":"Jureta, I.J., Faulkner, S., Achbany, Y., Saerens, M.: Dynamic web service composition within a service-oriented architecture. In: IEEE International Conference on Web Services, ICWS 2007, pp. 304\u2013311. IEEE (2007)","DOI":"10.1109\/ICWS.2007.79"},{"issue":"2","key":"11_CR8","first-page":"105","volume":"2","author":"V. K\u00f6n\u00f6nen","year":"2004","unstructured":"K\u00f6n\u00f6nen, V.: Asymmetric multiagent reinforcement learning. Web Intelligence and Agent Systems\u00a02(2), 105\u2013121 (2004)","journal-title":"Web Intelligence and Agent Systems"},{"key":"11_CR9","doi-asserted-by":"crossref","unstructured":"Littman, M.L.: Markov games as a framework for multi-agent reinforcement learning. In: ICML, vol.\u00a094, pp. 157\u2013163 (1994)","DOI":"10.1016\/B978-1-55860-335-6.50027-1"},{"issue":"1","key":"11_CR10","doi-asserted-by":"publisher","first-page":"55","DOI":"10.1016\/S1389-0417(01)00015-8","volume":"2","author":"M.L. Littman","year":"2001","unstructured":"Littman, M.L.: Value-function reinforcement learning in markov games. Cognitive Systems Research\u00a02(1), 55\u201366 (2001)","journal-title":"Cognitive Systems Research"},{"issue":"5","key":"11_CR11","doi-asserted-by":"publisher","first-page":"686","DOI":"10.1109\/TKDE.2005.82","volume":"17","author":"Z. Maamar","year":"2005","unstructured":"Maamar, Z., Mostefaoui, S.K., Yahyaoui, H.: Toward an agent-based and context-oriented approach for web services composition. IEEE Transactions on Knowledge and Data Engineering\u00a017(5), 686\u2013697 (2005)","journal-title":"IEEE Transactions on Knowledge and Data Engineering"},{"issue":"1","key":"11_CR12","doi-asserted-by":"publisher","first-page":"258","DOI":"10.1006\/jeth.1996.0014","volume":"68","author":"D. Monderer","year":"1996","unstructured":"Monderer, D., Shapley, L.S.: Fictitious play property for games with identical interests. Journal of Economic Theory\u00a068(1), 258 (1996)","journal-title":"Journal of Economic Theory"},{"key":"11_CR13","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"298","DOI":"10.1007\/978-3-642-45005-1_21","volume-title":"Service-Oriented Computing","author":"A. Moustafa","year":"2013","unstructured":"Moustafa, A., Zhang, M.: Multi-objective service composition using reinforcement learning. In: Basu, S., Pautasso, C., Zhang, L., Fu, X. (eds.) ICSOC 2013. LNCS, vol.\u00a08274, pp. 298\u2013312. Springer, Heidelberg (2013)"},{"issue":"1","key":"11_CR14","doi-asserted-by":"publisher","first-page":"15","DOI":"10.1109\/TSC.2008.1","volume":"1","author":"S.C. Oh","year":"2008","unstructured":"Oh, S.C., Lee, D., Kumara, S.R.: Effective web service composition in diverse and large-scale service networks. IEEE Transactions on Services Computing\u00a01(1), 15\u201332 (2008)","journal-title":"IEEE Transactions on Services Computing"},{"key":"11_CR15","doi-asserted-by":"crossref","unstructured":"Panait, L., Luke, S.: Cooperative multi-agent learning: The state of the art. In: Proceedings of 2005 Autonomous Agents and Multi-Agent Systems(AAMAS), vol.\u00a011(3), pp. 387\u2013434 (November 2005)","DOI":"10.1007\/s10458-005-2631-2"},{"issue":"1","key":"11_CR16","doi-asserted-by":"crossref","first-page":"45","DOI":"10.3233\/NGS-130201","volume":"9","author":"P. Papadopoulos","year":"2013","unstructured":"Papadopoulos, P., Tianfield, H., Moffat, D., Barrie, P.: Decentralized multi-agent service composition. Multiagent and Grid Systems\u00a09(1), 45\u2013100 (2013)","journal-title":"Multiagent and Grid Systems"},{"key":"11_CR17","unstructured":"Rummery, G.A., Niranjan, M.: On-line Q-learning using connectionist systems. University of Cambridge, Department of Engineering (1994)"},{"key":"11_CR18","unstructured":"Sutton, R.S., Barto, A.G.: Reinforcement learning: An introduction, vol.\u00a01. Cambridge Univ. Press (1998)"},{"key":"11_CR19","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"220","DOI":"10.1007\/978-3-642-37401-2_23","volume-title":"Web Technologies and Applications","author":"H. Wang","year":"2013","unstructured":"Wang, H., Wang, X.: A novel approach to large-scale services composition. In: Ishikawa, Y., Li, J., Wang, W., Zhang, R., Zhang, W. (eds.) APWeb 2013. LNCS, vol.\u00a07808, pp. 220\u2013227. Springer, Heidelberg (2013)"},{"key":"11_CR20","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"92","DOI":"10.1007\/978-3-642-17358-5_7","volume-title":"Service-Oriented Computing","author":"H. Wang","year":"2010","unstructured":"Wang, H., Zhou, X., Zhou, X., Liu, W., Li, W., Bouguettaya, A.: Adaptive service composition based on reinforcement learning. In: Maglio, P.P., Weske, M., Yang, J., Fantinato, M. (eds.) ICSOC 2010. LNCS, vol.\u00a06470, pp. 92\u2013107. Springer, Heidelberg (2010)"},{"key":"11_CR21","unstructured":"Wang, X., Sandholm, T.: Reinforcement learning to play an optimal nash equilibrium in team markov games. In: NIPS, vol.\u00a015, pp. 1571\u20131578 (2002)"},{"key":"11_CR22","doi-asserted-by":"crossref","unstructured":"Xu, W., Cao, J., Zhao, H., Wang, L.: A multi-agent learning model for service composition. In: 2012 IEEE Asia-Pacific Services Computing Conference (APSCC), pp. 70\u201375. IEEE (2012)","DOI":"10.1109\/APSCC.2012.44"},{"issue":"1","key":"11_CR23","doi-asserted-by":"publisher","first-page":"57","DOI":"10.2307\/2951778","volume":"61","author":"H.P. Young","year":"1993","unstructured":"Young, H.P.: The evolution of conventions. Econometrica\u00a061(1), 57\u201384 (1993)","journal-title":"Econometrica"}],"container-title":["Lecture Notes in Computer Science","Service-Oriented Computing"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-662-45391-9_11","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,10,26]],"date-time":"2019-10-26T20:12:23Z","timestamp":1572120743000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-662-45391-9_11"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014]]},"ISBN":["9783662453902","9783662453919"],"references-count":23,"URL":"https:\/\/doi.org\/10.1007\/978-3-662-45391-9_11","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2014]]}}}