{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,13]],"date-time":"2026-01-13T21:21:43Z","timestamp":1768339303902,"version":"3.49.0"},"reference-count":42,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"9","license":[{"start":{"date-parts":[[2024,9,1]],"date-time":"2024-09-01T00:00:00Z","timestamp":1725148800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2024,9,1]],"date-time":"2024-09-01T00:00:00Z","timestamp":1725148800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,9,1]],"date-time":"2024-09-01T00:00:00Z","timestamp":1725148800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"Urmia University, Urmia, Iran"},{"name":"Mobile Telecommunication Company of Iran"},{"name":"Research and Development, Tehran, Iran","award":["DR-51-0011-0030"],"award-info":[{"award-number":["DR-51-0011-0030"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Veh. Technol."],"published-print":{"date-parts":[[2024,9]]},"DOI":"10.1109\/tvt.2024.3386587","type":"journal-article","created":{"date-parts":[[2024,4,24]],"date-time":"2024-04-24T17:26:34Z","timestamp":1713979594000},"page":"12962-12977","source":"Crossref","is-referenced-by-count":9,"title":["Joint Power Allocation and User Fairness Optimization for Reinforcement Learning Over mmWave-NOMA Heterogeneous Networks"],"prefix":"10.1109","volume":"73","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7264-4062","authenticated-orcid":false,"given":"Sima","family":"Sobhi-Givi","sequence":"first","affiliation":[{"name":"Electrical and Computer Engineering Department, Urmia University, Urmia, Iran"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4901-9859","authenticated-orcid":false,"given":"Mahdi","family":"Nouri","sequence":"additional","affiliation":[{"name":"Electrical Engineering Department, Sharif University of Technology, Tehran, Iran"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9888-1261","authenticated-orcid":false,"given":"Mahrokh G.","family":"Shayesteh","sequence":"additional","affiliation":[{"name":"Electrical and Computer Engineering Department, Urmia University, Urmia, Iran"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2431-4920","authenticated-orcid":false,"given":"Hashem","family":"Kalbkhani","sequence":"additional","affiliation":[{"name":"Faculty of Electrical Engineering, Urmia University of Technology, Urmia, Iran"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5280-384X","authenticated-orcid":false,"given":"Zhiguo","family":"Ding","sequence":"additional","affiliation":[{"name":"Electrical Engineering Department and Computer Science, Khalifa University, Abu Dhabi, UAE"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/OJCOMS.2020.2969899"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1155\/2019\/1914762"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/VTCFall.2018.8690681"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2020.3041020"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2017.2725519"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2020.3003062"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2017.2673248"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2017.2725878"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2017.2699059"},{"issue":"2","key":"ref10","first-page":"814","article-title":"An analysis of Q-learning algorithms with strategies of reward function","volume":"3","author":"Manju","year":"2011","journal-title":"Int. J. Comput. Sci. Eng."},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1126\/science.aaa8415"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-62703-748-8_7"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2018.2867180"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.3390\/s20247094"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICTC49870.2020.9289376"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICCSE.2014.6926537"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/VTCFall.2013.6692057"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TNSE.2020.3004333"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1049\/cmu2.12177"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2022.3159612"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2019.2926757"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TCOMM.2017.2779150"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ICC.2018.8422363"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/JSYST.2019.2937463"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2020.3000192"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/SII52469.2022.9708805"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2013.130509"},{"key":"ref28","article-title":"Guidelines for evaluation of radio interface technologies for IMT-2020","author":"Series","year":"2017"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1023\/A:1016200519958"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2016.2543733"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/90.879343"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2016.2583421"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1080\/23311916.2018.1502242"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TSP.2016.2614794"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.3390\/su12020687"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1007\/s00158-009-0460-7"},{"issue":"2","key":"ref37","first-page":"455","article-title":"Effective implementation of the $\\varepsilon$-constraint method in multi-objective mathematical programming problems","volume":"213","author":"Mavrotas","year":"2009","journal-title":"Appl. Math. Comput."},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511804441"},{"key":"ref39","volume-title":"Reinforcement Learning: An Introduction","author":"Sutton","year":"2018"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.32604\/cmc.2022.021917"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-13-8285-7_13"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2017.2782726"}],"container-title":["IEEE Transactions on Vehicular Technology"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/25\/10683799\/10508101.pdf?arnumber=10508101","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,19]],"date-time":"2024-09-19T06:46:16Z","timestamp":1726728376000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10508101\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,9]]},"references-count":42,"journal-issue":{"issue":"9"},"URL":"https:\/\/doi.org\/10.1109\/tvt.2024.3386587","relation":{},"ISSN":["0018-9545","1939-9359"],"issn-type":[{"value":"0018-9545","type":"print"},{"value":"1939-9359","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,9]]}}}