{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,15]],"date-time":"2026-01-15T00:35:58Z","timestamp":1768437358731,"version":"3.49.0"},"reference-count":45,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,6,30]],"date-time":"2024-06-30T00:00:00Z","timestamp":1719705600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,6,30]],"date-time":"2024-06-30T00:00:00Z","timestamp":1719705600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100010002","name":"Ministry of Education","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100010002","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,6,30]]},"DOI":"10.1109\/ijcnn60899.2024.10651268","type":"proceedings-article","created":{"date-parts":[[2024,9,9]],"date-time":"2024-09-09T17:35:05Z","timestamp":1725903305000},"page":"1-9","source":"Crossref","is-referenced-by-count":4,"title":["BCQQ: Batch-Constraint Quantum Q-Learning with Cyclic Data Re-uploading"],"prefix":"10.1109","author":[{"given":"Maniraman","family":"Periyasamy","sequence":"first","affiliation":[{"name":"Fraunhofer Institute for Integrated Circuits IIS,Fraunhofer IIS,Nuremberg,Germany"}]},{"given":"Marc","family":"H\u00f6lle","sequence":"additional","affiliation":[{"name":"Fraunhofer Institute for Integrated Circuits IIS,Fraunhofer IIS,Nuremberg,Germany"}]},{"given":"Marco","family":"Wiedmann","sequence":"additional","affiliation":[{"name":"Fraunhofer Institute for Integrated Circuits IIS,Fraunhofer IIS,Nuremberg,Germany"}]},{"given":"Daniel D.","family":"Scherer","sequence":"additional","affiliation":[{"name":"Fraunhofer Institute for Integrated Circuits IIS,Fraunhofer IIS,Nuremberg,Germany"}]},{"given":"Axel","family":"Plinge","sequence":"additional","affiliation":[{"name":"Fraunhofer Institute for Integrated Circuits IIS,Fraunhofer IIS,Nuremberg,Germany"}]},{"given":"Christopher","family":"Mutschler","sequence":"additional","affiliation":[{"name":"Fraunhofer Institute for Integrated Circuits IIS,Fraunhofer IIS,Nuremberg,Germany"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1126\/science.aar6404"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1038\/s41586-022-05172-4"},{"key":"ref3","article-title":"Striving for simplicity in off-policy deep reinforcement learning","author":"Agarwal","year":"2020"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1103\/physrevc.106.034325"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevX.6.031007"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2023.3234911"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1038\/s41467-022-32550-3"},{"key":"ref8","article-title":"A survey on quantum reinforcement learning","author":"Meyer","year":"2022"},{"key":"ref9","article-title":"Openai gym","volume-title":"CoRR","author":"Brockman","year":"2016"},{"key":"ref10","article-title":"Benchmarking batch deep reinforcement learning algorithms","author":"Fujimoto","year":"2019"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-27645-3_1"},{"key":"ref12","volume-title":"Reinforcement learning: An introduction","author":"Sutton","year":"2018"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1038\/nature14236"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevA.101.032308"},{"key":"ref15","article-title":"Hybrid quantum-classical classifier based on tensor network and variational quantum circuit","author":"Chen","year":"2020"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/JHEP02(2021)212"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1017\/cbo9780511976667"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevA.98.032309"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevA.103.032430"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.3389\/fphy.2020.00297"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.22331\/q-2022-05-24-720"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1103\/physreva.99.032331"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1007\/s11128-021-03140-x"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1103\/physreva.107.032407"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.3390\/molecules27030597"},{"key":"ref26","article-title":"On the convergence of adam and beyond","author":"Reddi","year":"2019"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/QCE57702.2023.00058"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1007\/11539117_97"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/TSMCB.2008.925743"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1145\/237814.237866"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.3010470"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i6.25872"},{"key":"ref33","first-page":"2052","article-title":"Off-policy deep reinforcement learning without exploration","volume-title":"International conference on machine learning","author":"Fujimoto"},{"key":"ref34","first-page":"263","article-title":"Issues in using function approximation for reinforcement learning","volume-title":"Proceedings of the Fourth Connectionist Models Summer School","volume":"255","author":"Thrun"},{"key":"ref35","article-title":"Offline reinforcement learning: Tutorial, review, and perspectives on open problems","author":"Levine","year":"2020"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.5555\/3016100.3016191"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1016\/j.jfranklin.2022.08.021"},{"key":"ref38","first-page":"24 592","article-title":"Quantum policy gradient algorithm with optimized action decoding","volume-title":"International Conference on Machine Learning","author":"Meyer"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.22331\/q-2020-02-06-226"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/QCE53715.2022.00021"},{"key":"ref41","article-title":"A scale-dependent notion of effective dimension","author":"Berezniuk","year":"2020"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1038\/s43588-021-00084-1"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/18.481776"},{"key":"ref44","article-title":"Qiskit: An open-source framework for quantum computing","year":"2023"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1103\/physrevlett.119.180509"}],"event":{"name":"2024 International Joint Conference on Neural Networks (IJCNN)","location":"Yokohama, Japan","start":{"date-parts":[[2024,6,30]]},"end":{"date-parts":[[2024,7,5]]}},"container-title":["2024 International Joint Conference on Neural Networks (IJCNN)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10649807\/10649898\/10651268.pdf?arnumber=10651268","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,10]],"date-time":"2024-09-10T06:38:35Z","timestamp":1725950315000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10651268\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,6,30]]},"references-count":45,"URL":"https:\/\/doi.org\/10.1109\/ijcnn60899.2024.10651268","relation":{},"subject":[],"published":{"date-parts":[[2024,6,30]]}}}