{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,25]],"date-time":"2026-01-25T02:20:01Z","timestamp":1769307601193,"version":"3.49.0"},"reference-count":55,"publisher":"Springer Science and Business Media LLC","issue":"13","license":[{"start":{"date-parts":[[2022,12,15]],"date-time":"2022-12-15T00:00:00Z","timestamp":1671062400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,12,15]],"date-time":"2022-12-15T00:00:00Z","timestamp":1671062400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2023,5]]},"DOI":"10.1007\/s11042-022-14231-x","type":"journal-article","created":{"date-parts":[[2022,12,15]],"date-time":"2022-12-15T20:04:20Z","timestamp":1671134660000},"page":"20079-20100","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":8,"title":["Proximal policy optimization based hybrid recommender systems for large scale recommendations"],"prefix":"10.1007","volume":"82","author":[{"given":"Vaibhav","family":"Padhye","sequence":"first","affiliation":[]},{"given":"Kailasam","family":"Lakshmanan","sequence":"additional","affiliation":[]},{"given":"Amrita","family":"Chaturvedi","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,12,15]]},"reference":[{"key":"14231_CR1","unstructured":"Akerkar B, Sajja P (2010) Knowledge-based systems. MIT press Cambridge, 978-0763776473"},{"key":"14231_CR2","first-page":"829","volume":"171","author":"MF Aljunid","year":"2020","unstructured":"Aljunid MF, Manjaiah DH (2020) An efficient deep learning approach for collaborative filtering recommender system procedia computer science. Third International Conference on Computing and Network Communications (CoCoNet\u201919) 171:829\u2013836","journal-title":"Third International Conference on Computing and Network Communications (CoCoNet\u201919)"},{"key":"14231_CR3","doi-asserted-by":"publisher","first-page":"26","DOI":"10.1109\/MSP.2017.2743240","volume":"2","author":"K Arulkumaran","year":"2017","unstructured":"Arulkumaran K, Deisenroth MP, Brundage M, Bharath AA (2017) A brief survey of deep reinforcement learning. IEEE Signal Proc Mag 2:26\u201338","journal-title":"IEEE Signal Proc Mag"},{"key":"14231_CR4","doi-asserted-by":"crossref","unstructured":"Bhatti UA, Huang M, Wang H, Zhang Y, Mehmood A, Wu D (2018) Recommendation system for immunization coverage and monitoring. Human Vaccines & Immunotherapeutics, 165\u2013171","DOI":"10.1080\/21645515.2017.1379639"},{"key":"14231_CR5","doi-asserted-by":"crossref","unstructured":"Bhatti UA, Huang M, Wu D, Zhang Y, Mehmood A, Han H (2019) Recommendation system using feature extraction and pattern recognition in clinical care systems. Enterprise Information Systems, 329\u2013351","DOI":"10.1080\/17517575.2018.1557256"},{"key":"14231_CR6","unstructured":"Breese JS, Heckerman D, Kadie C (2013) Empirical analysis of predictive algorithms for collaborative filtering. In: Proceedings of the Fourteenth Conference on Uncertainty in Artificial Intelligence, pp. 43\u201352, UAI\u201998, Madison, Wisconsin"},{"key":"14231_CR7","unstructured":"Brockman G, Cheung V, Pettersson L, Schneider J, Schulman J, Tang J, Zaremba W (2016) Openai Gym. arXiv:1606.01540"},{"key":"14231_CR8","doi-asserted-by":"publisher","first-page":"331","DOI":"10.1023\/A:1021240730564","volume":"12","author":"R Burke","year":"2002","unstructured":"Burke R (2002) Hybrid recommender systems: survey and experiments. User Modeling and User-adapted Interaction 12:331\u2013370","journal-title":"User Modeling and User-adapted Interaction"},{"key":"14231_CR9","doi-asserted-by":"crossref","unstructured":"Chen H (2021) A DQN-based Recommender System for Item-list Recommendation. In: IEEE International Conference on Big Data (Big Data), pp 5699\u20135702","DOI":"10.1109\/BigData52589.2021.9671947"},{"key":"14231_CR10","doi-asserted-by":"crossref","unstructured":"Chen M, Beutel A, Covington P, Jain S, Belletti F, Chi Ed (2019) Top-K Off-Policy Correction for a REINFORCE Recommender System, Association for Computing Machinery, New York, NY, USA, 456\u2013464","DOI":"10.1145\/3289600.3290999"},{"key":"14231_CR11","unstructured":"Chen X, Yao L, McAuley J, Zhou G, Wang X (2021) A survey of deep reinforcement learning in recommender systems: a systematic review and future directions. arXiv:2109.03540"},{"key":"14231_CR12","unstructured":"Dulac-Arnold G, Evans R, Hasselt HV, Sunehag P, Lillicrap T, Hunt J, Mann T, Weber T, Degris T, Coppin B (2015) Reinforcement learning in large discrete action spaces. Corr, abs\/1512.07679"},{"key":"14231_CR13","doi-asserted-by":"crossref","unstructured":"He X, Li L, Zhang H, Nie L, Hu X, Chua TS (2017) Neural collaborative filtering. In: Proceedings of the 26th international conference on world wide web, pp 173\u2013182","DOI":"10.1145\/3038912.3052569"},{"key":"14231_CR14","doi-asserted-by":"crossref","unstructured":"Hu Y, Da Q, Zeng A, Yu Y, Xu Y (2018) Reinforcement learning to rank in e-commerce search engine Formalization, analysis, and application. Corr, abs\/1803.00710","DOI":"10.1145\/3219819.3219846"},{"key":"14231_CR15","doi-asserted-by":"crossref","unstructured":"Koren Y (2008) Factorization meets the neighborhood: a multifaceted collaborative filtering model. In: Association for computing machinery, New York, USA, pp. 426\u2013434","DOI":"10.1145\/1401890.1401944"},{"key":"14231_CR16","doi-asserted-by":"crossref","unstructured":"Li L, Chu W, Langford J, Chapire RE (2010) A contextual-bandit approach to personalized news article recommendation. J Mach Learn Res, 661\u2013670","DOI":"10.1145\/1772690.1772758"},{"key":"14231_CR17","doi-asserted-by":"publisher","first-page":"45451","DOI":"10.1109\/ACCESS.2018.2885084","volume":"7","author":"W Li","year":"2019","unstructured":"Li W, Zhou X, Shimizu S, Xin M, Jiang J, Gao H, Jin Q (2019) Personalization recommendation algorithm based on trust correlation degree and matrix factorization. IEEE Access 7:45451\u201345459","journal-title":"IEEE Access"},{"key":"14231_CR18","doi-asserted-by":"publisher","first-page":"227","DOI":"10.1109\/TCSS.2020.2965234","volume":"8","author":"W Lin","year":"2021","unstructured":"Lin W, Zhang X, Qi L, Li W, Li S, Sheng VS, Nepal S (2021) Location-Aware Service recommendations with Privacy-Preservation in the internet of things. IEEE Trans Comput Social Syst 8:227\u2013235","journal-title":"IEEE Trans Comput Social Syst"},{"key":"14231_CR19","unstructured":"Liu F, Tang R, Li X, Zhang W, Ye Y, Chen H, Guo H, Zhang Y (2018) Deep reinforcement learning based recommenda- tion with explicit user-item interactions modeling, arXiv:1810.12027"},{"key":"14231_CR20","doi-asserted-by":"crossref","unstructured":"Liu Y, Wang S, Khan MS, He J (2018) A novel deep hybrid recommender system based on auto-encoder with neural collaborative filtering. Big Data Mining and Analytics, 211\u2013221","DOI":"10.26599\/BDMA.2018.9020019"},{"key":"14231_CR21","unstructured":"Marlin B (2003) Modeling User Rating Profiles for Collaborative Filtering. MIT Press. Cambridge, MA, USA"},{"key":"14231_CR22","unstructured":"Mnih A, Salakhutdinov R (2008) Probabilistic matrix factorization. NIPS, 1257\u20131264"},{"key":"14231_CR23","doi-asserted-by":"crossref","unstructured":"Mnih A, Salakhutdinov R (2008) Bayesian probabilistic matrix factorization using markov chain monte carlo. ICML, pp. 880\u2013887","DOI":"10.1145\/1390156.1390267"},{"key":"14231_CR24","doi-asserted-by":"crossref","unstructured":"Pan F, Cai Q, Tang P, Zhuang F, He Q (2019) Policy Gradients for Contextual Recommendations. In: Association for Computing Machinery, New York, NY, USA, 1421\u20131431","DOI":"10.1145\/3308558.3313616"},{"key":"14231_CR25","doi-asserted-by":"crossref","unstructured":"Polat H, Du W (2005) SVD-based collaborative filtering with privacy. Association for Computing Machinery, 791\u2013795, New York, NY, USA","DOI":"10.1145\/1066677.1066860"},{"key":"14231_CR26","first-page":"1","volume":"22","author":"A Raffin","year":"2021","unstructured":"Raffin A, Hill A, Gleave A, Kanervisto A, Ernestus M, Dormann N (2021) Stable-Baselines3 reliable reinforcement learning implementations. J Mach Learn Res 22:1\u20138","journal-title":"J Mach Learn Res"},{"key":"14231_CR27","doi-asserted-by":"crossref","unstructured":"Salakhutdinov R, Mnih A, Hinton G (2007) Restricted Boltzmann machines for collaborative filtering. NIPS, 791\u2013798","DOI":"10.1145\/1273496.1273596"},{"key":"14231_CR28","unstructured":"Sarwar B, Karypis G, Konstan J, Riedl J (2017) Item-based collaborative filtering recommendation algorithms. arXiv:1707.06347"},{"key":"14231_CR29","unstructured":"Schulman J, Wolski P, Dhariwal P, Radford A, Klimo O (2017) Proximal policy optimization algorithms. arXiv:1707.06347"},{"key":"14231_CR30","doi-asserted-by":"crossref","unstructured":"Sedhain S, Menon AK, Sanner S, Xie L (2015) Autorec: Autoencoders meet collaborative filtering. In: Proceedings of the 24th International Conference on World Wide Web, WWW \u201915, Companion, New York, NY. USA, 111\u2013112","DOI":"10.1145\/2740908.2742726"},{"key":"14231_CR31","first-page":"1265","volume":"15324435","author":"G Shani","year":"2005","unstructured":"Shani G, Heckerman D, Brafman I (2005) An mdp-based recommender system. J Mach Learn Res 15324435:1265\u20131295","journal-title":"J Mach Learn Res"},{"key":"14231_CR32","doi-asserted-by":"crossref","unstructured":"Singh M (2020) Scalability and sparsity issues in recommender datasets: a survey. Knowl Inf Syst, 1\u201343","DOI":"10.1007\/s10115-018-1254-2"},{"key":"14231_CR33","doi-asserted-by":"crossref","unstructured":"Srivihok A, Sukonmanee P (2005) E-Commerce intelligent agent personalization travel support agent using q learning. In: Association for Computing Machinery, New York, NY USA","DOI":"10.1145\/1089551.1089606"},{"key":"14231_CR34","unstructured":"Sutton R (1998) Reinforcement learning: an introduction. vol. 1, no. 1., MIT press Cambridge"},{"key":"14231_CR35","unstructured":"Sutton R, Singh S, McAllester D (2000) Comparing policy-gradient algorithms. IEEE Transactions on Systems Man, and Cybernetics"},{"key":"14231_CR36","doi-asserted-by":"crossref","unstructured":"Taghipour N, Kardan A (2008) A hybrid web recommender system based on q-learning. In: Proceedings of the ACM Symposium on Applied Computing (SAC), Fortaleza, Ceara, Brazil, pp. 1164\u20131168, March, 16\u201320, 2008","DOI":"10.1145\/1363686.1363954"},{"key":"14231_CR37","doi-asserted-by":"crossref","unstructured":"Tao Y, Wang C, Yao L, Li W, Yu Y (2021) Item trend learning for sequential recommendation system using gated graph neural network. Neural Comput & Applic, 1\u201316","DOI":"10.1007\/s00521-021-05723-2"},{"key":"14231_CR38","unstructured":"Van Hasselt H, Doron Y, Strub F, Hessel M, Sonnerat N, Modayil J (2018) Deep reinforcement learning and the deadly triad, arXiv:1812.02648"},{"key":"14231_CR39","unstructured":"Van den Oord A, Dieleman S, Schrauwen B (2013) Deep content-based music recommendation. NIPS, 2643\u20132651"},{"key":"14231_CR40","doi-asserted-by":"crossref","unstructured":"Vincent P, Larochelle H, Bengio Y, Manzagol PA (2008) Extracting and composing robust features with denoising autoencoders. In: Proceedings of the 25th International Conference on Machine Learning, Helsinki, Finland, 1096\u20131103","DOI":"10.1145\/1390156.1390294"},{"key":"14231_CR41","unstructured":"Vozalis M, Margaritis K (2004) Collaborative filtering enhanced by Demographic Correleation"},{"key":"14231_CR42","first-page":"117","volume":"2","author":"M Vozalis","year":"2006","unstructured":"Vozalis M, Margaritis K (2006) On the enhancement of collaborative filtering by demographic data. Web Intelligence and Agent Systems 2:117\u2013138","journal-title":"Web Intelligence and Agent Systems"},{"key":"14231_CR43","doi-asserted-by":"crossref","unstructured":"Wang H, Wang N, Yeung DY (2015) Collaborative deep learning for recommender systems. KDD, 1235\u20131244","DOI":"10.1145\/2783258.2783273"},{"key":"14231_CR44","doi-asserted-by":"crossref","unstructured":"Wei K, Huang J, Fu S (2007) A survey of e-commerce recommender systems. In: 2007 International conference on service systems and service management. pp 1\u20135","DOI":"10.1109\/ICSSSM.2007.4280214"},{"key":"14231_CR45","doi-asserted-by":"crossref","unstructured":"Wilcoxon F (1945) Individual comparisons by ranking methods. Biometrics Bulletin, 80\u201383","DOI":"10.2307\/3001968"},{"key":"14231_CR46","doi-asserted-by":"crossref","unstructured":"Wu Y, DuBois C, Zheng AX, Ester M (2016) Collaborative denoising auto-encoders for top-N recommender systems. In: Proceedings of the Ninth ACM International Conference on Web Search and Data Mining, pp 153\u2013162","DOI":"10.1145\/2835776.2835837"},{"key":"14231_CR47","unstructured":"Wu C, Rajeswaran A, Duan Y, Kumar V, Bayen AM, Kakade S, Mordatch I, Abbeel P (2018) Variance reduction for policy gradient with action-dependent factorized baselines, arXiv:1803.07246"},{"key":"14231_CR48","doi-asserted-by":"crossref","unstructured":"Xue H, Dai X, Zhang J, Huang S, Chen J (2017) Deep matrix factorization models for recommender systems, IJCAI 3203\u20133209, 17, Melbourne, Australia","DOI":"10.24963\/ijcai.2017\/447"},{"key":"14231_CR49","doi-asserted-by":"crossref","unstructured":"Zhang S, Yao L, Sun A, Tay Y (2019) Deep Learning Based Recommender System: A Survey and New Perspectives. ACM Comput. Surv., 52","DOI":"10.1145\/3285029"},{"key":"14231_CR50","doi-asserted-by":"crossref","unstructured":"Zhao X, Xia L, Zhang L, Ding Z, Yin D, Tang J (2018) Deep reinforcement learning for page-wise recommendations, abs\/1801.00209","DOI":"10.1145\/3240323.3240374"},{"key":"14231_CR51","doi-asserted-by":"crossref","unstructured":"Zhao X, Zhang L, Ding Z, Xia L, Tang J, Yin D (2018) Recommendations with negative feedback via pairwise deep reinforcement learning. Corr2, abs\/1802.06501","DOI":"10.1145\/3219819.3219886"},{"key":"14231_CR52","first-page":"167","volume":"2","author":"G Zheng","year":"2018","unstructured":"Zheng G, Zhang F, Zheng Z, Xiang Y, Nicholas J, Xie X, Li ZDRN (2018) A deep reinforcement learning framework for news recommendation. International World Wide Web Conferences Steering Committee 2:167\u2013176","journal-title":"International World Wide Web Conferences Steering Committee"},{"key":"14231_CR53","doi-asserted-by":"crossref","unstructured":"Zheng G, Zhang F, Zheng Z, Xiang Y, Yuan NJ, Xie X, Li ZDRN (2018) DRN: a deep reinforcement learning framework for news recommendation. WWW 2018, Lyon, France, April, 23-27, 167\u2013176","DOI":"10.1145\/3178876.3185994"},{"key":"14231_CR54","doi-asserted-by":"crossref","unstructured":"Zou L, Xia L, Du P, Zhang Z, Bai T, Liu W, Nie JY, Yin D (2020) Pseudo Dyna-Q: a reinforcement learning framework for interactive recommendation. In: Association for computing machinery, New York, NY, USA, pp. 816\u2013824","DOI":"10.1145\/3336191.3371801"},{"key":"14231_CR55","doi-asserted-by":"crossref","unstructured":"Zou L, Xia L, Gu Y, Zhao X, Liu W, Huang J, Yin D (2020) Neural interactive collaborative filtering. In: Proceedings of the 43rd International ACM SIGIR Conference on Research and Development in Information Retrieval, pp 749\u2013758","DOI":"10.1145\/3397271.3401181"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-022-14231-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-022-14231-x\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-022-14231-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,4,22]],"date-time":"2023-04-22T04:16:36Z","timestamp":1682136996000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-022-14231-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,12,15]]},"references-count":55,"journal-issue":{"issue":"13","published-print":{"date-parts":[[2023,5]]}},"alternative-id":["14231"],"URL":"https:\/\/doi.org\/10.1007\/s11042-022-14231-x","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"value":"1380-7501","type":"print"},{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,12,15]]},"assertion":[{"value":"19 March 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 June 2022","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 November 2022","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 December 2022","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"All authors declare that they have no conflicts of interest and this research received no funding.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"<!--Emphasis Type='Bold' removed-->Conflict of Interests"}}]}}