{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,27]],"date-time":"2025-10-27T16:16:55Z","timestamp":1761581815037,"version":"3.37.3"},"reference-count":41,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"7","license":[{"start":{"date-parts":[[2019,7,1]],"date-time":"2019-07-01T00:00:00Z","timestamp":1561939200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2019,7,1]],"date-time":"2019-07-01T00:00:00Z","timestamp":1561939200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2019,7,1]],"date-time":"2019-07-01T00:00:00Z","timestamp":1561939200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100002858","name":"China Postdoctoral Science Foundation","doi-asserted-by":"publisher","award":["2018M640079"],"award-info":[{"award-number":["2018M640079"]}],"id":[{"id":"10.13039\/501100002858","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61801025","61771054"],"award-info":[{"award-number":["61801025","61771054"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Veh. Technol."],"published-print":{"date-parts":[[2019,7]]},"DOI":"10.1109\/tvt.2019.2909055","type":"journal-article","created":{"date-parts":[[2019,4,3]],"date-time":"2019-04-03T22:18:36Z","timestamp":1554329916000},"page":"6891-6902","source":"Crossref","is-referenced-by-count":28,"title":["Buffer-Aware Streaming in Small-Scale Wireless Networks: A Deep Reinforcement Learning Approach"],"prefix":"10.1109","volume":"68","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8870-9046","authenticated-orcid":false,"given":"Yashuang","family":"Guo","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1006-7594","authenticated-orcid":false,"given":"F. Richard","family":"Yu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6441-9711","authenticated-orcid":false,"given":"Jianping","family":"An","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1059-0705","authenticated-orcid":false,"given":"Kai","family":"Yang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7079-8682","authenticated-orcid":false,"given":"Ying","family":"He","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3529-2640","authenticated-orcid":false,"given":"Victor C. M.","family":"Leung","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref39","first-page":"197","author":"mao","year":"0","journal-title":"Proc ACM Special Interest Group on Communications Conf"},{"article-title":"Hierarchical deep reinforcement learning: Integrating temporal abstraction and intrinsic motivation","year":"0","author":"kulkarni","key":"ref38"},{"article-title":"Adam: A method for stochastic optimization","year":"2017","author":"kingma","key":"ref33"},{"year":"0","key":"ref32","article-title":"Tensorflow.org."},{"article-title":"TensorFlow: Large-scale machine learning on heterogeneous systems","year":"2016","author":"abadi","key":"ref31"},{"article-title":"Massively parallel methods for deep reinforcement learning","year":"2015","author":"nair","key":"ref30"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2018.2805379"},{"key":"ref36","first-page":"257","article-title":"iDASH: Improved dynamic adaptive streaming over HTTP using scalable video coding","author":"sanchez","year":"0","journal-title":"Proc of ACM Multimedia Systems"},{"article-title":"Continuous control with deep reinforcement learning","year":"2016","author":"lillicrapc","key":"ref35"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2017.2751641"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TNET.2018.2879979"},{"key":"ref40","article-title":"Asynchronous methods for deep reinforcement learning","author":"mnih","year":"0","journal-title":"Proc 33 rd Int Conf Mach Learn"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2009.2036294"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2011.2160158"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2011.110516"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2015.2437071"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/GLOCOM.2007.991"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2013.2284894"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2015.2441708"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TNN.1998.712192"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/25.790549"},{"key":"ref28","first-page":"1057","article-title":"Policy gradient methods for reinforcement learning with function approximation","author":"sutton","year":"0","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref4","doi-asserted-by":"crossref","first-page":"1331","DOI":"10.1109\/TMM.2009.2030543","article-title":"Smooth control of adaptive media playout for video streaming","volume":"11","author":"su","year":"2009","journal-title":"IEEE Trans Multimedia"},{"key":"ref27","volume":"i ii","author":"bertsekas","year":"2011","journal-title":"Dynamic Programming and Optimal Control"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2012.56"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/2785956.2787486"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2017.2724060"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2016.2519882"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2017.2695738"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2015.2494218"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.2017.1601142"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TMECH.2018.2812643"},{"year":"2018","key":"ref1","article-title":"Cisco visual networking index: Global mobile data traffic forecast update 2016&#x2013;2021"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/WCNC.2014.6953124"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511841224"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1038\/nature14236"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/25.350282"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.2017.1700410"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2017.2735301"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/26.803503"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2008.926683"}],"container-title":["IEEE Transactions on Vehicular Technology"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/25\/8764674\/08681145.pdf?arnumber=8681145","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,7,13]],"date-time":"2022-07-13T21:08:05Z","timestamp":1657746485000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8681145\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,7]]},"references-count":41,"journal-issue":{"issue":"7"},"URL":"https:\/\/doi.org\/10.1109\/tvt.2019.2909055","relation":{},"ISSN":["0018-9545","1939-9359"],"issn-type":[{"type":"print","value":"0018-9545"},{"type":"electronic","value":"1939-9359"}],"subject":[],"published":{"date-parts":[[2019,7]]}}}