{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,20]],"date-time":"2026-03-20T15:44:33Z","timestamp":1774021473475,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":25,"publisher":"ACM","license":[{"start":{"date-parts":[[2021,7,2]],"date-time":"2021-07-02T00:00:00Z","timestamp":1625184000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"Shenzhen Science and Technology Program","award":["Grant No. RCYX20200714114523079"],"award-info":[{"award-number":["Grant No. RCYX20200714114523079"]}]},{"name":"NSFC","award":["Grant No. 61936011?No. 61521002?No. 61872215"],"award-info":[{"award-number":["Grant No. 61936011?No. 61521002?No. 61872215"]}]},{"name":"Beijing Key Lab of Networked Multimedia"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2021,7,16]]},"DOI":"10.1145\/3458306.3460995","type":"proceedings-article","created":{"date-parts":[[2021,6,30]],"date-time":"2021-06-30T21:32:58Z","timestamp":1625088778000},"page":"34-41","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":16,"title":["PAAS"],"prefix":"10.1145","author":[{"given":"Chenglei","family":"Wu","sequence":"first","affiliation":[{"name":"Beijing Key Lab of Networked Multimedia"}]},{"given":"Zhi","family":"Wang","sequence":"additional","affiliation":[{"name":"Tsinghua University"}]},{"given":"Lifeng","family":"Sun","sequence":"additional","affiliation":[{"name":"Beijing Key Lab of Networked Multimedia and Tsinghua University and Ministry of Education, China"}]}],"member":"320","published-online":{"date-parts":[[2021,7,2]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/3123266.3123414"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1145\/3083187.3083190"},{"key":"e_1_3_2_1_3_1","first-page":"564","volume-title":"Cls: A cross-user learning based system for improving qoe in 360-degree video adaptive streaming,\" in Proceedings of the 26th ACM international conference on Multimedia","author":"Xie L.","year":"2018","unstructured":"L. Xie , X. Zhang , and Z. Guo , \" Cls: A cross-user learning based system for improving qoe in 360-degree video adaptive streaming,\" in Proceedings of the 26th ACM international conference on Multimedia , 2018 , pp. 564 -- 572 . L. Xie, X. Zhang, and Z. Guo, \"Cls: A cross-user learning based system for improving qoe in 360-degree video adaptive streaming,\" in Proceedings of the 26th ACM international conference on Multimedia, 2018, pp. 564--572."},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/3123266.3123372"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/3123266.3123453"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/3123266.3123339"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/3123266.3123291"},{"key":"e_1_3_2_1_8_1","first-page":"962","volume-title":"IEEE","author":"Zhou C.","year":"2018","unstructured":"C. Zhou , M. Xiao , and Y. Liu , \" Clustile: Toward minimizing bandwidth in 360-degree video streaming,\" in IEEE INFOCOM 2018-IEEE Conference on Computer Communications . IEEE , 2018 , pp. 962 -- 970 . C. Zhou, M. Xiao, and Y. Liu, \"Clustile: Toward minimizing bandwidth in 360-degree video streaming,\" in IEEE INFOCOM 2018-IEEE Conference on Computer Communications. IEEE, 2018, pp. 962--970."},{"key":"e_1_3_2_1_9_1","volume-title":"IEEE","author":"Zhang Y.","year":"2019","unstructured":"Y. Zhang , P. Zhao , K. Bian , Y. Liu , L. Song , and X. Li , \" Drl360: 360-degree video streaming with deep reinforcement learning,\" in IEEE INFOCOM 2019-IEEE Conference on Computer Communications . IEEE , 2019 . Y. Zhang, P. Zhao, K. Bian, Y. Liu, L. Song, and X. Li, \"Drl360: 360-degree video streaming with deep reinforcement learning,\" in IEEE INFOCOM 2019-IEEE Conference on Computer Communications. IEEE, 2019."},{"key":"e_1_3_2_1_10_1","first-page":"290","volume-title":"IEEE","author":"Fu J.","year":"2019","unstructured":"J. Fu , X. Chen , Z. Zhang , S. Wu , and Z. Chen , \" 360srl: A sequential reinforcement learning approach for abr tile-based 360 video streaming,\" in 2019 IEEE International Conference on Multimedia and Expo (ICME) . IEEE , 2019 , pp. 290 -- 295 . J. Fu, X. Chen, Z. Zhang, S. Wu, and Z. Chen, \"360srl: A sequential reinforcement learning approach for abr tile-based 360 video streaming,\" in 2019 IEEE International Conference on Multimedia and Expo (ICME). IEEE, 2019, pp. 290--295."},{"key":"e_1_3_2_1_11_1","first-page":"4030","volume-title":"Speech and Signal Processing (ICASSP)","author":"Kan N.","year":"2019","unstructured":"N. Kan , J. Zou , K. Tang , C. Li , N. Liu , and H. Xiong , \" Deep reinforcement learning-based rate adaptation for adaptive 360-degree video streaming,\" in ICASSP 2019 - 2019 IEEE International Conference on Acoustics , Speech and Signal Processing (ICASSP) , May 2019 , pp. 4030 -- 4034 . N. Kan, J. Zou, K. Tang, C. Li, N. Liu, and H. Xiong, \"Deep reinforcement learning-based rate adaptation for adaptive 360-degree video streaming,\" in ICASSP 2019 - 2019 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), May 2019, pp. 4030--4034."},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1145\/3204949.3204970"},{"key":"e_1_3_2_1_13_1","first-page":"601","volume-title":"Dynamic preferences in multi-criteria reinforcement learning,\" in Proceedings of the 22nd international conference on Machine learning","author":"Natarajan S.","year":"2005","unstructured":"S. Natarajan and P. Tadepalli , \" Dynamic preferences in multi-criteria reinforcement learning,\" in Proceedings of the 22nd international conference on Machine learning , 2005 , pp. 601 -- 608 . S. Natarajan and P. Tadepalli, \"Dynamic preferences in multi-criteria reinforcement learning,\" in Proceedings of the 22nd international conference on Machine learning, 2005, pp. 601--608."},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.5555\/2627435.2750356"},{"key":"e_1_3_2_1_15_1","first-page":"14636","volume-title":"A generalized algorithm for multi-objective reinforcement learning and policy adaptation,\" in Advances in Neural Information Processing Systems 32","author":"Yang R.","year":"2019","unstructured":"R. Yang , X. Sun , and K. Narasimhan , \" A generalized algorithm for multi-objective reinforcement learning and policy adaptation,\" in Advances in Neural Information Processing Systems 32 , H. Wallach, H. Larochelle, A. Beygelzimer, F. deBuc, E. Fox, and R. Garnett, Eds. Curran Associates, Inc. , 2019 , pp. 14636 -- 14647 . R. Yang, X. Sun, and K. Narasimhan, \"A generalized algorithm for multi-objective reinforcement learning and policy adaptation,\" in Advances in Neural Information Processing Systems 32, H. Wallach, H. Larochelle, A. Beygelzimer, F. deBuc, E. Fox, and R. Garnett, Eds. Curran Associates, Inc., 2019, pp. 14636--14647."},{"key":"e_1_3_2_1_16_1","first-page":"197","volume-title":"ACM","author":"Mao H.","year":"2017","unstructured":"H. Mao , R. Netravali , and M. Alizadeh , \" Neural adaptive video streaming with pensieve,\" in Proceedings of the Conference of the ACM Special Interest Group on Data Communication . ACM , 2017 , pp. 197 -- 210 . H. Mao, R. Netravali, and M. Alizadeh, \"Neural adaptive video streaming with pensieve,\" in Proceedings of the Conference of the ACM Special Interest Group on Data Communication. ACM, 2017, pp. 197--210."},{"key":"e_1_3_2_1_17_1","first-page":"1995","volume-title":"Dueling network architectures for deep reinforcement learning,\" in International conference on machine learning","author":"Wang Z.","year":"2016","unstructured":"Z. Wang , T. Schaul , M. Hessel , H. Hasselt , M. Lanctot , and N. Freitas , \" Dueling network architectures for deep reinforcement learning,\" in International conference on machine learning , 2016 , pp. 1995 -- 2003 . Z. Wang, T. Schaul, M. Hessel, H. Hasselt, M. Lanctot, and N. Freitas, \"Dueling network architectures for deep reinforcement learning,\" in International conference on machine learning, 2016, pp. 1995--2003."},{"key":"e_1_3_2_1_18_1","first-page":"11","article-title":"Dynamic weights in multi-objective deep reinforcement learning","author":"Abels A.","year":"2019","unstructured":"A. Abels , D. Roijers , T. Lenaerts , A. Now\u00e9 , and D. Steckelmacher , \" Dynamic weights in multi-objective deep reinforcement learning ,\" in International Conference on Machine Learning , 2019 , pp. 11 -- 20 . A. Abels, D. Roijers, T. Lenaerts, A. Now\u00e9, and D. Steckelmacher, \"Dynamic weights in multi-objective deep reinforcement learning,\" in International Conference on Machine Learning, 2019, pp. 11--20.","journal-title":"International Conference on Machine Learning"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1162\/neco_a_01232"},{"key":"e_1_3_2_1_20_1","volume-title":"An empirical investigation of catastrophic forgetting in gradient-based neural networks,\" arXiv preprint arXiv:1312.6211","author":"Goodfellow I. J.","year":"2013","unstructured":"I. J. Goodfellow , M. Mirza , D. Xiao , A. Courville , and Y. Bengio , \" An empirical investigation of catastrophic forgetting in gradient-based neural networks,\" arXiv preprint arXiv:1312.6211 , 2013 . I. J. Goodfellow, M. Mirza, D. Xiao, A. Courville, and Y. Bengio, \"An empirical investigation of catastrophic forgetting in gradient-based neural networks,\" arXiv preprint arXiv:1312.6211, 2013."},{"key":"e_1_3_2_1_21_1","volume-title":"Prioritized experience replay,\" arXiv preprint arXiv:1511.05952","author":"Schaul T.","year":"2015","unstructured":"T. Schaul , J. Quan , I. Antonoglou , and D. Silver , \" Prioritized experience replay,\" arXiv preprint arXiv:1511.05952 , 2015 . T. Schaul, J. Quan, I. Antonoglou, and D. Silver, \"Prioritized experience replay,\" arXiv preprint arXiv:1511.05952, 2015."},{"key":"e_1_3_2_1_22_1","first-page":"114","volume-title":"Commute path bandwidth traces from 3g networks: analysis and applications,\" in Proceedings of the 4th ACM Multimedia Systems Conference","author":"Riiser H.","year":"2013","unstructured":"H. Riiser , P. Vigmostad , C. Griwodz , and P. Halvorsen , \" Commute path bandwidth traces from 3g networks: analysis and applications,\" in Proceedings of the 4th ACM Multimedia Systems Conference , 2013 , pp. 114 -- 118 . H. Riiser, P. Vigmostad, C. Griwodz, and P. Halvorsen, \"Commute path bandwidth traces from 3g networks: analysis and applications,\" in Proceedings of the 4th ACM Multimedia Systems Conference, 2013, pp. 114--118."},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/3083187.3083210"},{"key":"e_1_3_2_1_24_1","first-page":"1161","volume-title":"IEEE","author":"Bao Y.","year":"2016","unstructured":"Y. Bao , H. Wu , T. Zhang , A. A. Ramli , and X. Liu , \" Shooting a moving target: Motion-prediction-based transmission for 360-degree videos,\" in 2016 IEEE International Conference on Big Data (Big Data) . IEEE , 2016 , pp. 1161 -- 1170 . Y. Bao, H. Wu, T. Zhang, A. A. Ramli, and X. Liu, \"Shooting a moving target: Motion-prediction-based transmission for 360-degree videos,\" in 2016 IEEE International Conference on Big Data (Big Data). IEEE, 2016, pp. 1161--1170."},{"key":"e_1_3_2_1_25_1","volume-title":"Rainbow: Combining improvements in deep reinforcement learning,\" in Thirty-Second AAAI Conference on Artificial Intelligence","author":"Hessel M.","year":"2018","unstructured":"M. Hessel , J. Modayil , H. Van Hasselt , T. Schaul , G. Ostrovski , W. Dabney , D. Horgan , B. Piot , M. Azar , and D. Silver , \" Rainbow: Combining improvements in deep reinforcement learning,\" in Thirty-Second AAAI Conference on Artificial Intelligence , 2018 . M. Hessel, J. Modayil, H. Van Hasselt, T. Schaul, G. Ostrovski, W. Dabney, D. Horgan, B. Piot, M. Azar, and D. Silver, \"Rainbow: Combining improvements in deep reinforcement learning,\" in Thirty-Second AAAI Conference on Artificial Intelligence, 2018."}],"event":{"name":"MMSys '21: 12th ACM Multimedia Systems Conference","location":"Istanbul Turkey","acronym":"MMSys '21","sponsor":["SIGMM ACM Special Interest Group on Multimedia","SIGCOMM ACM Special Interest Group on Data Communication","SIGMOBILE ACM Special Interest Group on Mobility of Systems, Users, Data and Computing"]},"container-title":["Proceedings of the 31st ACM Workshop on Network and Operating Systems Support for Digital Audio and Video"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3458306.3460995","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3458306.3460995","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T21:28:19Z","timestamp":1750195699000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3458306.3460995"}},"subtitle":["a preference-aware deep reinforcement learning approach for 360\u00b0 video streaming"],"short-title":[],"issued":{"date-parts":[[2021,7,2]]},"references-count":25,"alternative-id":["10.1145\/3458306.3460995","10.1145\/3458306"],"URL":"https:\/\/doi.org\/10.1145\/3458306.3460995","relation":{},"subject":[],"published":{"date-parts":[[2021,7,2]]},"assertion":[{"value":"2021-07-02","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}