{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,7]],"date-time":"2026-03-07T05:53:09Z","timestamp":1772862789654,"version":"3.50.1"},"reference-count":37,"publisher":"Springer Science and Business Media LLC","issue":"3-4","license":[{"start":{"date-parts":[[2025,2,1]],"date-time":"2025-02-01T00:00:00Z","timestamp":1738368000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,2,1]],"date-time":"2025-02-01T00:00:00Z","timestamp":1738368000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Wireless Pers Commun"],"published-print":{"date-parts":[[2025,2]]},"DOI":"10.1007\/s11277-025-11753-z","type":"journal-article","created":{"date-parts":[[2025,4,4]],"date-time":"2025-04-04T08:19:52Z","timestamp":1743754792000},"page":"945-969","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Optimizing Relay Selection in D2D Communication for Next-Generation Wireless Networks Using Multi-Agent Reinforcement Learning: A Novel Approach"],"prefix":"10.1007","volume":"140","author":[{"given":"Muharrem","family":"Sirma","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Adnan","family":"Kavak","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"A. Burak","family":"Inner","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,4,2]]},"reference":[{"key":"11753_CR1","doi-asserted-by":"publisher","unstructured":"Driouech, S., Sabir,E., & Bennis, M. (2020) D2D Mobile Relaying for Efficient Throughput-Reliability Delivering in 5G, ICC 2020 - 2020 IEEE international conference on communications (ICC), Dublin, Ireland pp. 1-7, https:\/\/doi.org\/10.1109\/ICC40277.2020.9148893.","DOI":"10.1109\/ICC40277.2020.9148893."},{"key":"11753_CR2","doi-asserted-by":"publisher","unstructured":"Delgado, O., & Labeau, F. (2016) D2D relay selection and fairness on 5G wireless networks,. IEEE globecom workshops (GC Wkshps). Washington, DC, 2016, 1\u20136. https:\/\/doi.org\/10.1109\/GLOCOMW.2016.7848868","DOI":"10.1109\/GLOCOMW.2016.7848868"},{"key":"11753_CR3","doi-asserted-by":"publisher","unstructured":"Zhang, X., Lin, Z., Ding, B., Gu, B., & Han, Y. (2020). Deep Multi-Agent reinforcement learning for resource allocation in D2D communication underlaying cellular networks. 21st Asia-Spacific network operations and management symposium (APNOMS), Daegu. Korea (South), 2020, 55\u201360. https:\/\/doi.org\/10.23919\/APNOMS50412.2020.9237060","DOI":"10.23919\/APNOMS50412.2020.9237060"},{"key":"11753_CR4","doi-asserted-by":"publisher","unstructured":"Murkaz FN (2016). : Architecture and protocols for inter-cell device-to-device communication in 5G networks, et al. IEEE 14th Int, l conf on dependable, autonomic and secure computing, 14th Int, l conf on pervasive intelligence and computing, 2nd int, l conf on big data intelligence and computing and cyber science and technology congress (DASC\/PiCom\/DataCom\/CyberSciTech). Auckland, 2016, 489\u2013492. https:\/\/doi.org\/10.1109\/DASC-PICom-DataCom-CyberSciTec.2016.95","DOI":"10.1109\/DASC-PICom-DataCom-CyberSciTec.2016.95"},{"issue":"7","key":"11753_CR5","doi-asserted-by":"publisher","first-page":"4417","DOI":"10.1109\/TWC.2018.2825318","volume":"17","author":"H Shah-Mansouri, Ma","year":"2018","unstructured":"Shah-Mansouri, Ma, H., & Wong, V. . W. . S. (2018). Full-duplex relaying for D2D communication in millimeter wave-based 5G networks. IEEE Transactions on Wireless Communications, 17(7), 4417\u20134431. https:\/\/doi.org\/10.1109\/TWC.2018.2825318","journal-title":"IEEE Transactions on Wireless Communications"},{"key":"11753_CR6","doi-asserted-by":"publisher","unstructured":"Jayakumar, S., & S, N. (2021). A review on resource allocation techniques in D2D communication for 5G and B5G technology. Peer-to-Peer Netw. Appl. 14, 243-269. https:\/\/doi.org\/10.1007\/s12083-020-00962-x.","DOI":"10.1007\/s12083-020-00962-x"},{"key":"11753_CR7","doi-asserted-by":"publisher","unstructured":"Uyoata, U., & Dlodlo, M. (2017) Joint power allocation and relay selection for relay assisted D2D communication with channel uncertainties, IEEE EUROCON 2017 -17th international conference on smart technologies, pp. 486-490, https:\/\/doi.org\/10.1109\/EUROCON.2017.8011158.","DOI":"10.1109\/EUROCON.2017.8011158."},{"key":"11753_CR8","doi-asserted-by":"publisher","first-page":"71","DOI":"10.1016\/j.jnca.2018.10.012","volume":"129","author":"Pedhadiya Mittal K","year":"2019","unstructured":"Mittal K, Pedhadiya, Jha, Rakesh Kumar, & Bhatt, Hetal G.. (2019). Device to device communication: A surveyJournal of Network and Computer Applications, 129, 71\u201389. https:\/\/doi.org\/10.1016\/j.jnca.2018.10.012. ISSN 1084-8045.","journal-title":"Journal of Network and Computer Applications"},{"issue":"6","key":"11753_CR9","doi-asserted-by":"publisher","first-page":"6452","DOI":"10.1109\/TVT.2020.2985873","volume":"69","author":"X Wang","year":"2020","unstructured":"Wang, X., Jin, T., Hu, L., & Qian, Z. (2020). Energy-efficient power allocation and Q-learning-based relay selection for relay-aided D2D communication. IEEE Transactions on Vehicular Technology, 69(6), 6452\u20136462. https:\/\/doi.org\/10.1109\/TVT.2020.2985873","journal-title":"IEEE Transactions on Vehicular Technology"},{"key":"11753_CR10","doi-asserted-by":"publisher","unstructured":"Shamganth, K., & Sibley, M. J. N. (2017) A survey on relay selection in cooperative device-to-device (D2D) communication for 5G cellular networks, 2017 international conference on energy, communication, data analytics and soft computing (ICECDS), pp. 42-46, https:\/\/doi.org\/10.1109\/ICECDS.2017.8390216.","DOI":"10.1109\/ICECDS.2017.8390216."},{"key":"11753_CR11","doi-asserted-by":"publisher","unstructured":"Mishra, P. K., Mishra, A. K., & Tripathi, S. (2019). Relay selection scheme for dynamic network scenario in multi-hop D2D communication, 2019 IEEE 4th International conference on computer and communication systems (ICCCS), pp. 538-542, https:\/\/doi.org\/10.1109\/CCOMS.2019.8821780.","DOI":"10.1109\/CCOMS.2019.8821780."},{"issue":"5","key":"11753_CR12","doi-asserted-by":"publisher","first-page":"1357","DOI":"10.1109\/LWC.2019.2917907","volume":"8","author":"P Zhang","year":"2019","unstructured":"Zhang, P., Kang, X., Li, X., Liu, Y., Wu, D., & Wang, R. (2019). Overlapping community deep exploring-based relay selection method toward multi-hop D2D communication. IEEE Wireless Communications Letters, 8(5), 1357\u20131360. https:\/\/doi.org\/10.1109\/LWC.2019.2917907","journal-title":"IEEE Wireless Communications Letters"},{"key":"11753_CR13","doi-asserted-by":"publisher","unstructured":"Mukhopadhyay, R., Neogy, S., & Chattopadhyay, S. (2020). Dynamic relay selection using a greedy cluster strategy. IEEE international conference on advanced networks and telecommunications systems (ANTS),2020, 1\u20134. https:\/\/doi.org\/10.1109\/ANTS50601.2020.9342757","DOI":"10.1109\/ANTS50601.2020.9342757"},{"key":"11753_CR14","doi-asserted-by":"publisher","unstructured":"Panwar, Nisha, Sharma, Shantanu, & Singh, Awadhesh Kumar: (2016) A survey on 5G: The next generation of mobile communication, Physical Communication, Volume 18, Part 2, Pages 64-84, ISSN 1874-4907, https:\/\/doi.org\/10.1016\/j.phycom.2015.10.006.","DOI":"10.1016\/j.phycom.2015.10.006."},{"issue":"7","key":"11753_CR15","doi-asserted-by":"publisher","first-page":"4379","DOI":"10.1109\/TWC.2021.3058636","volume":"20","author":"CV Anamuro","year":"2021","unstructured":"Anamuro, C. V., Varsier, N., Schwoerer, J., & Lagrange, X. (2021). Distance-aware relay selection in an energy-efficient discovery protocol for 5G D2D communication. IEEE Transactions on Wireless Communications, 20(7), 4379\u20134391. https:\/\/doi.org\/10.1109\/TWC.2021.3058636","journal-title":"IEEE Transactions on Wireless Communications"},{"key":"11753_CR16","doi-asserted-by":"publisher","first-page":"744","DOI":"10.1109\/ICESC48915.2020.9155595","volume":"2020","author":"D Prabakar","year":"2020","unstructured":"Prabakar, D., Lakshmy, N., & Vishnu, S. (2020). Dynamic channel state information based relay selection in device-to-device communication. International conference on electronics and sustainable communication systems (ICESC),2020, 744\u2013747. https:\/\/doi.org\/10.1109\/ICESC48915.2020.9155595","journal-title":"International Conference on Electronics and Sustainable Communication Systems (ICESC)"},{"issue":"9","key":"11753_CR17","doi-asserted-by":"publisher","first-page":"8303","DOI":"10.1109\/TVT.2017.2682123","volume":"66","author":"R Ma","year":"2017","unstructured":"Ma, R., Chang, Y.-J., Chen, H.-H., & Chiu, C.-Y. (2017). On relay selection schemes for relay-assisted D2D communications in LTE-A systems. IEEE Transactions on Vehicular Technology, 66(9), 8303\u20138314. https:\/\/doi.org\/10.1109\/TVT.2017.2682123","journal-title":"IEEE Transactions on Vehicular Technology"},{"key":"11753_CR18","doi-asserted-by":"publisher","unstructured":"Woo, W. H., Annur, R., & Ponnusamy, V. (2021). Performance evaluation for relay selection on device-to-device (D2D) communications in rayleigh fading, 2021 3rd international conference on advancements in computing (ICAC), pp. 140-145, https:\/\/doi.org\/10.1109\/ICAC54203.2021.9671128.","DOI":"10.1109\/ICAC54203.2021.9671128."},{"issue":"10","key":"11753_CR19","doi-asserted-by":"publisher","first-page":"143","DOI":"10.30534\/ijeter\/2024\/0112102024","volume":"12","author":"M Sirma","year":"2024","unstructured":"Sirma, M., Kavak, A., & Inner, A. B. (2024). Relay assisted device-to-device communication for future generation wireless networks: A review from architectural and challenges perspective. International Journal of Emerging Trends in Engineering Research, 12(10), 143\u2013152. https:\/\/doi.org\/10.30534\/ijeter\/2024\/0112102024","journal-title":"International Journal of Emerging Trends in Engineering Research"},{"issue":"12","key":"11753_CR20","doi-asserted-by":"publisher","first-page":"15800","DOI":"10.1109\/TVT.2020.3036489","volume":"69","author":"Y Li","year":"2020","unstructured":"Li, Y., Xu, G., Yang, K., Ge, J., Liu, P., & Jin, Z. (2020). Energy efficient relay selection and resource allocation in D2D-enabled mobile edge computing. IEEE Transactions on Vehicular Technology, 69(12), 15800\u201315814. https:\/\/doi.org\/10.1109\/TVT.2020.3036489","journal-title":"IEEE Transactions on Vehicular Technology"},{"key":"11753_CR21","doi-asserted-by":"publisher","unstructured":"Liu, M., Zhang, L., & Gautam, P. R. (2019). Joint Relay selection and resource allocation for relay-assisted D2D underlay communications, 2019 22nd international symposium on wireless personal multimedia communications (WPMC) pp. 1-6, https:\/\/doi.org\/10.1109\/WPMC48795.2019.9096172.","DOI":"10.1109\/WPMC48795.2019.9096172."},{"key":"11753_CR22","doi-asserted-by":"publisher","unstructured":"Kumarapandian, S., & Ahmed, Q. Z. (2021). Performance analysis of double-threshold based multi-relay selection with differential modulation for cooperative D2D network, 2021 IEEE 11th annual computing and communication workshop and conference (CCWC), pp. 1343-1346, https:\/\/doi.org\/10.1109\/CCWC51732.2021.9375930.","DOI":"10.1109\/CCWC51732.2021.9375930."},{"issue":"2","key":"11753_CR23","doi-asserted-by":"publisher","first-page":"2141","DOI":"10.1109\/TVT.2019.2960506","volume":"69","author":"J Chen","year":"2020","unstructured":"Chen, J., Zhang, L., Liang, Y.-C., & Ma, S. (2020). Optimal resource allocation for multicarrier NOMA in short packet communications. IEEE Transactions on Vehicular Technology, 69(2), 2141\u20132156. https:\/\/doi.org\/10.1109\/TVT.2019.2960506","journal-title":"IEEE Transactions on Vehicular Technology"},{"key":"11753_CR24","doi-asserted-by":"publisher","unstructured":"Abdelreheem, A., Omer, O. A., Esmaiel, H., & Mohamed, U. S. (2019). Deep Learning-based relay selection in D2D Wave Communications. international conference on computer and information sciences (ICCIS),2019, 1\u20135. https:\/\/doi.org\/10.1109\/ICCISci.2019.8716458","DOI":"10.1109\/ICCISci.2019.8716458"},{"key":"11753_CR25","doi-asserted-by":"publisher","unstructured":"Zia, K., Javed, N., Sial, M. N., Ahmed, S., & Pervez, F. (2018). Multi-agent RL based user-centric spectrum allocation scheme in D2D enabled hetnets IEEE 23rd international workshop on computer aided modeling and design of communication links and networks (CAMAD)Barcelona, 2018, 1\u20136. https:\/\/doi.org\/10.1109\/CAMAD.2018.8514983","DOI":"10.1109\/CAMAD.2018.8514983"},{"key":"11753_CR26","doi-asserted-by":"publisher","first-page":"6733","DOI":"10.1109\/ACCESS.2018.2890210","volume":"7","author":"K Zia","year":"2019","unstructured":"Zia, K., Javed, N., Sial, M. N., Ahmed, S., Pirzada, A. A., & Pervez, F. (2019). A distributed multi-agent rl-based autonomous spectrum allocation scheme in D2D enabled multi-tier hetnets. IEEE Access, 7, 6733\u20136745. https:\/\/doi.org\/10.1109\/ACCESS.2018.2890210","journal-title":"IEEE Access"},{"issue":"3","key":"11753_CR27","doi-asserted-by":"publisher","first-page":"416","DOI":"10.1109\/LWC.2019.2958814","volume":"9","author":"H Zhang","year":"2020","unstructured":"Zhang, H., Chong, S., Zhang, X., & Lin, N. (2020). A Deep reinforcement learning based D2D relay selection and power level allocation in mmwave vehicular networks. IEEE Wireless Communications Letters, 9(3), 416\u2013419. https:\/\/doi.org\/10.1109\/LWC.2019.2958814","journal-title":"IEEE Wireless Communications Letters"},{"key":"11753_CR28","doi-asserted-by":"publisher","unstructured":"Toumi, S., Hamdi, M., & Zaied, M. (2018). An adaptive Q-learning approach to power control for D2D communications, 2018 international conference on advanced systems and electric technologies (IC_ASET), Hammamet, pp. 206-209, https:\/\/doi.org\/10.1109\/ASET.2018.8379860.","DOI":"10.1109\/ASET.2018.8379860."},{"key":"11753_CR29","doi-asserted-by":"publisher","first-page":"164533","DOI":"10.1109\/ACCESS.2019.2952411","volume":"7","author":"KK Nguyen","year":"2019","unstructured":"Nguyen, K. K., Duong, T. Q., Vien, N. A., Le-Khac, N., & Nguyen, L. D. (2019). Distributed deep deterministic policy gradient for power allocation control in D2D-Based V2V communications. IEEE Access, 7, 164533\u2013164543. https:\/\/doi.org\/10.1109\/ACCESS.2019.2952411","journal-title":"IEEE Access"},{"key":"11753_CR30","doi-asserted-by":"publisher","first-page":"3143","DOI":"10.1109\/JIOT.2020.3014926","volume":"8","author":"I Budhiraja","year":"2020","unstructured":"Budhiraja, I., Kumar, N., & Tyagi, S.Deep reinforcement learning based proportional fair scheduling control scheme for underlay D2D communication, IEEE Internet of Things Journal 8, 3143,https:\/\/doi.org\/10.1109\/JIOT.2020.3014926.","journal-title":"IEEE Internet of Things Journal"},{"key":"11753_CR31","doi-asserted-by":"publisher","unstructured":"Park, H., & Lim, Y. (2020). Adaptive power control using reinforcement learning in 5G mobile networks, 2020 international conference on information networking (ICOIN), Barcelona, Spain, 409-414, https:\/\/doi.org\/10.1109\/ICOIN48656.2020.9016566.","DOI":"10.1109\/ICOIN48656.2020.9016566."},{"key":"11753_CR32","doi-asserted-by":"publisher","unstructured":"Qi, Y., & Geng, S. (2023). \u201cDeep-reinforcement-learning-based resource allocation for energy harvesting D2D communication,\u201d 2023 4th international conference on electronic communication and artificial intelligence (ICECAI), Guangzhou, China, 85-88, https:\/\/doi.org\/10.1109\/ICECAI58670.2023.10176743.","DOI":"10.1109\/ICECAI58670.2023.10176743."},{"issue":"6","key":"11753_CR33","doi-asserted-by":"publisher","first-page":"6452","DOI":"10.1109\/TVT.2020.2985873","volume":"69","author":"X Wang","year":"2020","unstructured":"Wang, X., Jin, T., Hu, L., & Qian, Z. (2020). Energy-efficient power allocation and q-learning-based relay selection for relay-aided D2D communication. IEEE Transactions on Vehicular Technology, 69(6), 6452\u20136462. https:\/\/doi.org\/10.1109\/TVT.2020.2985873","journal-title":"IEEE Transactions on Vehicular Technology"},{"key":"11753_CR34","doi-asserted-by":"publisher","unstructured":"Routray, R., & Patra, T. K. (2014). Reinforcement learning based path selection in multi-hop device to device communication,\u201d 2024 first international conference on electronics, communication and signal processing (ICECSP), New Delhi, India, pp. 1-5, https:\/\/doi.org\/10.1109\/ICECSP61809.2024.10698102.","DOI":"10.1109\/ICECSP61809.2024.10698102."},{"key":"11753_CR35","doi-asserted-by":"publisher","unstructured":"Gandotra, Pimmy, & Kumar Jha, Rakesh. (2016). Device-to-device communication in cellular networks: A Survey, Journal of Network and Computer Applications,71, 99-117https:\/\/doi.org\/10.1016\/j.jnca.2016.06.004.","DOI":"10.1016\/j.jnca.2016.06.004."},{"key":"11753_CR36","doi-asserted-by":"publisher","unstructured":"AlQerm, I., & Shihada, B. (2016). A cooperative online learning scheme for resource allocation in 5G systems, 2016 IEEE international conference on communications (ICC), Kuala Lumpur pp. 1-7, https:\/\/doi.org\/10.1109\/ICC.2016.7511617.","DOI":"10.1109\/ICC.2016.7511617."},{"key":"11753_CR37","doi-asserted-by":"publisher","unstructured":"Pupo, E. F., Gonz\u00e1lez, C. C., Iradier, E., Montalban, J., & Murroni, M. (2023). 5G link-level simulator for multicast\/broadcast services, IEEE international symposium on broadband multimedia systems and broadcasting (BMSB). Beijing, China, 2023, 1\u20136. https:\/\/doi.org\/10.1109\/BMSB58369.2023.10211507","DOI":"10.1109\/BMSB58369.2023.10211507"}],"container-title":["Wireless Personal Communications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11277-025-11753-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11277-025-11753-z\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11277-025-11753-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,19]],"date-time":"2025-05-19T06:02:38Z","timestamp":1747634558000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11277-025-11753-z"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,2]]},"references-count":37,"journal-issue":{"issue":"3-4","published-print":{"date-parts":[[2025,2]]}},"alternative-id":["11753"],"URL":"https:\/\/doi.org\/10.1007\/s11277-025-11753-z","relation":{"has-preprint":[{"id-type":"doi","id":"10.21203\/rs.3.rs-4597667\/v1","asserted-by":"object"}]},"ISSN":["0929-6212","1572-834X"],"issn-type":[{"value":"0929-6212","type":"print"},{"value":"1572-834X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,2]]},"assertion":[{"value":"7 March 2025","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 April 2025","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have not disclosed any competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}