{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,19]],"date-time":"2026-05-19T07:39:44Z","timestamp":1779176384220,"version":"3.51.4"},"reference-count":41,"publisher":"Springer Science and Business Media LLC","issue":"7849","license":[{"start":{"date-parts":[[2021,3,10]],"date-time":"2021-03-10T00:00:00Z","timestamp":1615334400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,3,10]],"date-time":"2021-03-10T00:00:00Z","timestamp":1615334400000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Nature"],"published-print":{"date-parts":[[2021,3,11]]},"DOI":"10.1038\/s41586-021-03242-7","type":"journal-article","created":{"date-parts":[[2021,3,10]],"date-time":"2021-03-10T17:04:19Z","timestamp":1615395859000},"page":"229-233","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":151,"title":["Experimental quantum speed-up in reinforcement\u00a0learning agents"],"prefix":"10.1038","volume":"591","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8746-9431","authenticated-orcid":false,"given":"V.","family":"Saggio","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"B. E.","family":"Asenbeck","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9016-3641","authenticated-orcid":false,"given":"A.","family":"Hamann","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"T.","family":"Str\u00f6mberg","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"P.","family":"Schiansky","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"V.","family":"Dunjko","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1950-8640","authenticated-orcid":false,"given":"N.","family":"Friis","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"N. C.","family":"Harris","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"M.","family":"Hochberg","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1043-3489","authenticated-orcid":false,"given":"D.","family":"Englund","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9137-4814","authenticated-orcid":false,"given":"S.","family":"W\u00f6lk","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"H. J.","family":"Briegel","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4964-817X","authenticated-orcid":false,"given":"P.","family":"Walther","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2021,3,10]]},"reference":[{"key":"3242_CR1","doi-asserted-by":"crossref","unstructured":"Sutton, R. S. & Barto, A. G. Reinforcement Learning: An Introduction (MIT Press, 1998).","DOI":"10.1109\/TNN.1998.712192"},{"key":"3242_CR2","doi-asserted-by":"publisher","first-page":"130501","DOI":"10.1103\/PhysRevLett.117.130501","volume":"117","author":"V Dunjko","year":"2016","unstructured":"Dunjko, V., Taylor, J. M. & Briegel, H. J. Quantum-enhanced machine learning. Phys. Rev. Lett. 117, 130501 (2016).","journal-title":"Phys. Rev. Lett."},{"key":"3242_CR3","first-page":"031002","volume":"4","author":"GD Paparo","year":"2014","unstructured":"Paparo, G. D., Dunjiko, V., Makmal, A., Martin-Delgrado, M. A. & Briegel, H. J. Quantum speedup for active learning agents. Phys. Rev. X4, 031002 (2014).","journal-title":"Phys. Rev. X"},{"key":"3242_CR4","doi-asserted-by":"publisher","first-page":"015014","DOI":"10.1088\/2058-9565\/aaef5e","volume":"4","author":"T Sriarunothai","year":"2019","unstructured":"Sriarunothai, T. et al. Speeding-up the decision making of a learning agent using an ion trap quantum processor. Quantum Sci. Technol. 4, 015014 (2019).","journal-title":"Quantum Sci. Technol."},{"key":"3242_CR5","doi-asserted-by":"crossref","unstructured":"Johannink, T. et al. Residual reinforcement learning for robot control. In 2019 International Conference on Robotics and Automation (ICRA) 6023\u20136029 (IEEE, 2019).","DOI":"10.1109\/ICRA.2019.8794127"},{"key":"3242_CR6","doi-asserted-by":"crossref","unstructured":"Tjandra, A., Sakti, S. & Nakamura, S. Sequence-to-aequence ASR optimization via reinforcement learning. In 2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP) 5829\u20135833 (IEEE, 2018).","DOI":"10.1109\/ICASSP.2018.8461705"},{"key":"3242_CR7","doi-asserted-by":"publisher","first-page":"1716","DOI":"10.1038\/s41591-018-0213-5","volume":"24","author":"M Komorowski","year":"2018","unstructured":"Komorowski, M., Celi, L. A., Badawi, O., Gordon, A. C. & Faisal A. A. The artificial intelligence clinician learns optimal treatment strategies for sepsis in intensive care. Nat. Med. 24, 1716\u20131720 (2018).","journal-title":"Nat. Med."},{"key":"3242_CR8","doi-asserted-by":"publisher","first-page":"891","DOI":"10.3389\/fnins.2018.00891","volume":"12","author":"CS Thakur","year":"2018","unstructured":"Thakur, C. S. et al. Large-scale neuromorphic spiking array processors: a quest to mimic the brain. Front. Neurosci. 12, 891 (2018).","journal-title":"Front. Neurosci."},{"key":"3242_CR9","doi-asserted-by":"publisher","DOI":"10.1038\/s41534-019-0174-7","volume":"5","author":"GR Steinbrecher","year":"2019","unstructured":"Steinbrecher, G. R., Olson, J. P., Englund, D. & Carolan, J. Quantum optical neural networks. npj Quantum Inf. 5, 60 (2019).","journal-title":"npj Quantum Inf."},{"key":"3242_CR10","doi-asserted-by":"publisher","first-page":"354","DOI":"10.1038\/nature24270","volume":"550","author":"D Silver","year":"2017","unstructured":"Silver, D. et al. Mastering the game of Go without human knowledge. Nature550, 354\u2013359 (2017).","journal-title":"Nature"},{"key":"3242_CR11","doi-asserted-by":"publisher","first-page":"505","DOI":"10.1038\/s41586-019-1666-5","volume":"574","author":"F Arute","year":"2019","unstructured":"Arute, F. et al. Quantum supremacy using a programmable superconducting processor. Nature574, 505\u2013510 (2019).","journal-title":"Nature"},{"key":"3242_CR12","doi-asserted-by":"publisher","first-page":"1207","DOI":"10.1109\/TSMCB.2008.925743","volume":"38","author":"D Dong","year":"2008","unstructured":"Dong. D., Chen, C., Li, H. & Tarn, T.-J. Quantum reinforcement learning. IEEE Trans. Syst. Man Cybern. B38, 1207\u20131220 (2008).","journal-title":"IEEE Trans. Syst. Man Cybern. B"},{"key":"3242_CR13","doi-asserted-by":"publisher","first-page":"074001","DOI":"10.1088\/1361-6633\/aab406","volume":"81","author":"V Dunjko","year":"2018","unstructured":"Dunjko, V. & Briegel, H. J. Machine learning & artificial intelligence in the quantum domain: a review of recent progress. Rep. Prog. Phys. 81, 074001 (2018).","journal-title":"Rep. Prog. Phys."},{"key":"3242_CR14","doi-asserted-by":"publisher","first-page":"48","DOI":"10.22331\/q-2018-01-29-48","volume":"2","author":"P Baireuther","year":"2018","unstructured":"Baireuther, P., O\u2019Brien, T. E., Tarasinski, B. & Beenakker, C. W. J. Machine-learning-assisted correction of correlated qubit errors in a topological code. Quantum2, 48 (2018).","journal-title":"Quantum"},{"key":"3242_CR15","doi-asserted-by":"publisher","first-page":"68","DOI":"10.22331\/q-2018-05-24-68","volume":"2","author":"NP Breuckmann","year":"2018","unstructured":"Breuckmann, N. P. & Ni, X. Scalable neural network decoders for higher dimensional quantum codes. Quantum2, 68\u201392 (2018).","journal-title":"Quantum"},{"key":"3242_CR16","doi-asserted-by":"publisher","first-page":"044002","DOI":"10.1088\/2058-9565\/aad1f7","volume":"3","author":"C Chamberland","year":"2018","unstructured":"Chamberland, C. & Ronagh, P. Deep neural decoders for near term fault-tolerant experiments. Quant. Sci. Technol. 3, 044002 (2018).","journal-title":"Quant. Sci. Technol."},{"key":"3242_CR17","first-page":"031084","volume":"8","author":"T F\u00f6sel","year":"2018","unstructured":"F\u00f6sel, T., Tighineanu, P., Weiss, T. & Marquardt, F. Reinforcement learning with neural networks for quantum feedback. Phys. Rev. X8, 031084 (2018).","journal-title":"Phys. Rev. X"},{"key":"3242_CR18","doi-asserted-by":"publisher","first-page":"215","DOI":"10.22331\/q-2019-12-16-215","volume":"3","author":"H Poulsen Nautrup","year":"2019","unstructured":"Poulsen Nautrup, H., Delfosse, N., Dunjko, V., Briegel, H. J. & Friis, N. Optimizing quantum error correction codes with reinforcement learning. Quantum3, 215 (2019).","journal-title":"Quantum"},{"key":"3242_CR19","doi-asserted-by":"publisher","first-page":"1800074","DOI":"10.1002\/qute.201800074","volume":"2","author":"S Yu","year":"2019","unstructured":"Yu, S. et al. Reconstruction of a photonic qubit state with reinforcement learning. Adv. Quantum Technol. 2, 1800074 (2019).","journal-title":"Adv. Quantum Technol."},{"key":"3242_CR20","doi-asserted-by":"publisher","first-page":"090405","DOI":"10.1103\/PhysRevLett.116.090405","volume":"116","author":"M Krenn","year":"2016","unstructured":"Krenn, M., Malik, M., Fickler, R., Lapkiewicz, R. & Zeilinger, A. Automated search for new quantum experiments. Phys. Rev. Lett. 116, 090405 (2016).","journal-title":"Phys. Rev. Lett."},{"key":"3242_CR21","doi-asserted-by":"publisher","first-page":"1221","DOI":"10.1073\/pnas.1714936115","volume":"115","author":"AA Melnikov","year":"2018","unstructured":"Melnikov, A. A. et al. Active learning machine learns to create new quantum experiments. Proc. Natl Acad. Sci. USA115, 1221\u20131226 (2018).","journal-title":"Proc. Natl Acad. Sci. USA"},{"key":"3242_CR22","doi-asserted-by":"publisher","first-page":"023006","DOI":"10.1088\/1367-2630\/17\/2\/023006","volume":"17","author":"V Dunjko","year":"2015","unstructured":"Dunjko, V., Friis, N. & Briegel, H. J. Quantum-enhanced deliberation of learning agents using trapped ions. New J. Phys. 17, 023006 (2015).","journal-title":"New J. Phys."},{"key":"3242_CR23","unstructured":"Jerbi, S., Poulsen Nautrup, H., Trenkwalder, L. M., Briegel, H. J. & Dunjko, V. A framework for deep energy-based reinforcement learning with quantum speed-up. Preprint at https:\/\/arxiv.org\/abs\/1910.12760 (2019)."},{"key":"3242_CR24","doi-asserted-by":"publisher","first-page":"1023","DOI":"10.1038\/nature07127","volume":"453","author":"HJ Kimble","year":"2008","unstructured":"Kimble, H. J. The quantum internet. Nature453, 1023\u20131030 (2008).","journal-title":"Nature"},{"key":"3242_CR25","doi-asserted-by":"publisher","first-page":"137","DOI":"10.1109\/MNET.001.1900092","volume":"34","author":"AS Cacciapuoti","year":"2020","unstructured":"Cacciapuoti, A. S. et al. Quantum internet: networking challenges in distributed quantum computing. IEEE Netw. 34, 137\u2013143 (2020).","journal-title":"IEEE Netw."},{"key":"3242_CR26","doi-asserted-by":"publisher","DOI":"10.1038\/srep00400","volume":"2","author":"HJ Briegel","year":"2012","unstructured":"Briegel, H. J. & De las Cuevas, G. Projective simulation for artificial intelligence. Sci. Rep. 2, 400 (2012).","journal-title":"Sci. Rep."},{"key":"3242_CR27","doi-asserted-by":"publisher","first-page":"325","DOI":"10.1103\/PhysRevLett.79.325","volume":"79","author":"LK Grover","year":"1997","unstructured":"Grover, L. K. Quantum mechanics helps in searching for a needle in a haystack. Phys. Rev. Lett. 79, 325\u2013328 (1997).","journal-title":"Phys. Rev. Lett."},{"key":"3242_CR28","unstructured":"Nielsen, M. A. & Chuang, I. L. Quantum Computation and Quantum Information (Cambridge Univ. Press, 2000)."},{"key":"3242_CR29","doi-asserted-by":"publisher","first-page":"045002","DOI":"10.1088\/1367-2630\/ab783c","volume":"22","author":"F Flamini","year":"2020","unstructured":"Flamini, F. et al. Photonic architecture for reinforcement learning. New. J. Phys. 22, 045002 (2020).","journal-title":"New. J. Phys."},{"key":"3242_CR30","doi-asserted-by":"publisher","first-page":"447","DOI":"10.1038\/nphoton.2017.95","volume":"11","author":"NC Harris","year":"2017","unstructured":"Harris, N. C. et al. Quantum transport simulations in a programmable nanophotonic processor. Nat. Photon. 11, 447\u2013452 (2017).","journal-title":"Nat. Photon."},{"key":"3242_CR31","doi-asserted-by":"publisher","first-page":"493","DOI":"10.1002\/(SICI)1521-3978(199806)46:4\/5<493::AID-PROP493>3.0.CO;2-P","volume":"46","author":"M Boyer","year":"1998","unstructured":"Boyer, M., Brassard, G., Hoyer, P. & Tappa, A. Tight bounds on quantum searching. Fortschr. Phys. 46, 493\u2013505 (1998).","journal-title":"Fortschr. Phys."},{"key":"3242_CR32","doi-asserted-by":"publisher","first-page":"1026","DOI":"10.1038\/nnano.2017.218","volume":"12","author":"P Senellart","year":"2017","unstructured":"Senellart, P., Solomon, G. & White, A. High-performance semiconductor quantum-dot single-photon sources. Nat. Nanotechnol. 12, 1026\u20131039 (2017).","journal-title":"Nat. Nanotechnol."},{"key":"3242_CR33","doi-asserted-by":"publisher","first-page":"226","DOI":"10.1038\/s41586-020-2441-3","volume":"583","author":"NH Wan","year":"2020","unstructured":"Wan, N. H. et al. Large-scale integration of artificial atoms in hybrid photonic circuits. Nature583, 226\u2013231 (2020).","journal-title":"Nature"},{"key":"3242_CR34","doi-asserted-by":"publisher","first-page":"356","DOI":"10.1038\/nphoton.2014.53","volume":"8","author":"TE Northup","year":"2014","unstructured":"Northup, T. E. & Blatt, R. Quantum information transfer using photons. Nat. Photon. 8, 356\u2013363 (2014).","journal-title":"Nat. Photon."},{"key":"3242_CR35","unstructured":"Denil, M. et al. Learning to perform physics experiments via deep reinforcement learning. Proc. Int. Conf. on Learning Representations (2017)."},{"key":"3242_CR36","first-page":"031086","volume":"8","author":"M Bukov","year":"2018","unstructured":"Bukov, M. et al. Reinforcement learning in different phases of quantum control. Phys. Rev. X8, 031086 (2018).","journal-title":"Phys. Rev. X"},{"key":"3242_CR37","unstructured":"Poulsen Nautrup, H. et al. Operationally meaningful representations of physical systems in neural networks. Preprint at https:\/\/arxiv.org\/abs\/2001.00593 (2020)."},{"key":"3242_CR38","doi-asserted-by":"publisher","first-page":"210501","DOI":"10.1103\/PhysRevLett.113.210501","volume":"113","author":"TJ Yoder","year":"2014","unstructured":"Yoder, T. J., Low, G. H. & Chuang, I. L. Fixed-point quantum search with an optimal number of queries. Phys. Rev. Lett. 113, 210501 (2014).","journal-title":"Phys. Rev. Lett."},{"key":"3242_CR39","doi-asserted-by":"publisher","first-page":"012316","DOI":"10.1103\/PhysRevA.73.012316","volume":"73","author":"T Kim","year":"2006","unstructured":"Kim, T., Fiorentino, M. & Wong, F. N. C. Phase-stable source of polarization-entangled photons using a polarization Sagnac interferometer. Phys. Rev. A73, 012316 (2006).","journal-title":"Phys. Rev. A"},{"key":"3242_CR40","doi-asserted-by":"publisher","first-page":"935","DOI":"10.1038\/s41567-019-0550-4","volume":"15","author":"V Saggio","year":"2019","unstructured":"Saggio, V. et al. Experimental few-copy multipartite entanglement detection. Nat. Phys. 15, 935\u2013940 (2019).","journal-title":"Nat. Phys."},{"key":"3242_CR41","doi-asserted-by":"publisher","first-page":"210","DOI":"10.1038\/nphoton.2013.13","volume":"7","author":"F Marsili","year":"2013","unstructured":"Marsili, F. et al. Detecting single infrared photons with 93% system efficiency. Nat. Photon. 7, 210\u2013214 (2013).","journal-title":"Nat. Photon."}],"container-title":["Nature"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/www.nature.com\/articles\/s41586-021-03242-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/www.nature.com\/articles\/s41586-021-03242-7","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/www.nature.com\/articles\/s41586-021-03242-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,5,20]],"date-time":"2023-05-20T22:09:03Z","timestamp":1684620543000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.nature.com\/articles\/s41586-021-03242-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,3,10]]},"references-count":41,"journal-issue":{"issue":"7849","published-print":{"date-parts":[[2021,3,11]]}},"alternative-id":["3242"],"URL":"https:\/\/doi.org\/10.1038\/s41586-021-03242-7","relation":{},"ISSN":["0028-0836","1476-4687"],"issn-type":[{"value":"0028-0836","type":"print"},{"value":"1476-4687","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,3,10]]},"assertion":[{"value":"12 August 2020","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 January 2021","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"10 March 2021","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"The authors declare no competing interests.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}