{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,30]],"date-time":"2025-12-30T08:52:11Z","timestamp":1767084731978,"version":"3.40.5"},"reference-count":46,"publisher":"Informa UK Limited","issue":"16","content-domain":{"domain":["www.tandfonline.com"],"crossmark-restriction":true},"short-container-title":["Advanced Robotics"],"published-print":{"date-parts":[[2021,8,18]]},"DOI":"10.1080\/01691864.2021.1959397","type":"journal-article","created":{"date-parts":[[2021,7,31]],"date-time":"2021-07-31T18:41:24Z","timestamp":1627756884000},"page":"1012-1027","update-policy":"https:\/\/doi.org\/10.1080\/tandf_crossmark_01","source":"Crossref","is-referenced-by-count":6,"title":["Safe and efficient imitation learning by clarification of experienced latent space"],"prefix":"10.1080","volume":"35","author":[{"given":"Hidehito","family":"Fujiishi","sequence":"first","affiliation":[{"name":"Division of Information Science, Nara Institute of Science and Technology, Nara, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3760-249X","authenticated-orcid":false,"given":"Taisuke","family":"Kobayashi","sequence":"additional","affiliation":[{"name":"Division of Information Science, Nara Institute of Science and Technology, Nara, Japan"}]},{"given":"Kenji","family":"Sugimoto","sequence":"additional","affiliation":[{"name":"Division of Information Science, Nara Institute of Science and Technology, Nara, Japan"}]}],"member":"301","published-online":{"date-parts":[[2021,7,31]]},"reference":[{"key":"CIT0001","doi-asserted-by":"publisher","DOI":"10.1016\/j.robot.2018.11.004"},{"key":"CIT0002","doi-asserted-by":"publisher","DOI":"10.1080\/01691864.2020.1844797"},{"key":"CIT0003","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2020.2974707"},{"volume-title":"Reinforcement learning: an introduction","year":"2018","author":"Sutton RS","key":"CIT0004"},{"key":"CIT0005","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8794127"},{"key":"CIT0006","doi-asserted-by":"publisher","DOI":"10.1098\/rstb.2002.1258"},{"key":"CIT0007","doi-asserted-by":"crossref","unstructured":"Bain M, Sammut C. A framework for behavioural cloning. In: Machine Intelligence; 1995. p. 103\u2013129.","DOI":"10.1093\/oso\/9780198538677.003.0006"},{"key":"CIT0008","unstructured":"Bojarski M, Del Testa D, Dworakowski D, et\u00a0al. End to end learning for self-driving cars. arXiv preprint arXiv:160407316. 2016."},{"key":"CIT0009","doi-asserted-by":"publisher","DOI":"10.1109\/70.538982"},{"key":"CIT0010","doi-asserted-by":"publisher","DOI":"10.1038\/nature10489"},{"key":"CIT0011","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2018\/687"},{"key":"CIT0012","doi-asserted-by":"publisher","DOI":"10.1109\/IEEECONF49454.2021.9382751"},{"key":"CIT0013","unstructured":"Kingma DP, Welling M. Auto-encoding variational Bayes. In: International Conference on Learning Representations. 2014."},{"key":"CIT0014","unstructured":"Higgins I, Matthey L, Pal A, et\u00a0al. Beta-vae: learning basic visual concepts with a constrained variational framework. In: International Conference on Learning Representations. 2017."},{"key":"CIT0015","unstructured":"Ng AY, Russell SJ. Algorithms for inverse reinforcement learning. In: International Conference on Machine Learning. 2000. p. 663\u2013670."},{"key":"CIT0016","unstructured":"Ho J, Ermon S. Generative adversarial imitation learning. arXiv preprint arXiv:160603476. 2016."},{"key":"CIT0017","unstructured":"Edwards A, Sahni H, Schroecker Y, et\u00a0al. Imitating latent policies from observation. In: International Conference on Machine Learning. PMLR; 2019. p. 1755\u20131763."},{"key":"CIT0018","doi-asserted-by":"crossref","unstructured":"Torabi F, Warnell G, Stone P. Generative adversarial imitation from observation. arXiv preprint arXiv:180706158. 2018.","DOI":"10.24963\/ijcai.2018\/687"},{"key":"CIT0019","unstructured":"Singh S, Silakari S. An ensemble approach for feature selection of cyber attack dataset. arXiv preprint arXiv:09121014. 2009."},{"key":"CIT0020","doi-asserted-by":"publisher","DOI":"10.1016\/j.jnca.2005.06.003"},{"key":"CIT0021","unstructured":"Ruff L, Vandermeulen RA, Franks BJ, et\u00a0al. Rethinking assumptions in deep anomaly detection. arXiv preprint arXiv:200600339. 2020."},{"key":"CIT0022","doi-asserted-by":"publisher","DOI":"10.1142\/S0218001409007326"},{"key":"CIT0023","unstructured":"M\u00fcnz G, Li S, Carle G. Traffic anomaly detection using k-means clustering. In: GI\/ITG Workshop MMBnet. 2007. p. 13\u201314."},{"key":"CIT0024","doi-asserted-by":"publisher","DOI":"10.1145\/2500853.2500857"},{"key":"CIT0025","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33019428"},{"issue":"1","key":"CIT0026","first-page":"1","volume":"2","author":"An J","year":"2015","journal-title":"Spec Lectur on IE"},{"key":"CIT0027","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00867"},{"key":"CIT0028","doi-asserted-by":"publisher","DOI":"10.1109\/ICMLA.2019.00270"},{"key":"CIT0029","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0152173"},{"key":"CIT0030","unstructured":"Nalisnick E, Matsukawa A, Teh YW, et\u00a0al. Do deep generative models know what they don't know? arXiv preprint arXiv:181009136. 2018."},{"key":"CIT0031","unstructured":"Kirichenko P, Izmailov P, Wilson AG. Why normalizing flows fail to detect out-of-distribution data. arXiv preprint arXiv:200608545. 2020."},{"key":"CIT0032","unstructured":"Nalisnick E, Matsukawa A, Teh YW, et\u00a0al. Detecting out-of-distribution inputs to deep generative models using typicality. arXiv preprint arXiv:190602994. 2019."},{"key":"CIT0033","doi-asserted-by":"publisher","DOI":"10.1126\/science.1127647"},{"key":"CIT0034","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.2992934"},{"key":"CIT0035","unstructured":"Dinh L, Sohl-Dickstein J, Bengio S. Density estimation using real nvp. arXiv preprint arXiv:160508803. 2016."},{"key":"CIT0036","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-387-73003-5_196"},{"key":"CIT0037","unstructured":"Bhalodia R, Lee I, Elhabian S. dpvaes: fixing sample generation for regularized vaes. arXiv preprint arXiv:191110506. 2019."},{"key":"CIT0038","unstructured":"Brockman G, Cheung V, Pettersson L, et\u00a0al. Openai gym. arXiv preprint arXiv:160601540. 2016."},{"key":"CIT0039","unstructured":"Schulman J, Wolski F, Dhariwal P, et\u00a0al. Proximal policy optimization algorithms. arXiv preprint arXiv:170706347. 2017."},{"key":"CIT0040","unstructured":"Kingma DP, Ba JAdam. A method for stochastic optimization. arXiv preprint arXiv:14126980. 2014."},{"key":"CIT0041","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8793484"},{"key":"CIT0042","unstructured":"Eysenbach B, Gu S, Ibarz J, et\u00a0al. Leave no trace: learning to reset for safe and autonomous reinforcement learning. arXiv preprint arXiv:171106782. 2017."},{"key":"CIT0043","doi-asserted-by":"crossref","unstructured":"Thananjeyan B, Balakrishna A, Nair S, et\u00a0al. Recovery rl: safe reinforcement learning with learned recovery zones. arXiv preprint arXiv:201015920. 2020.","DOI":"10.1109\/LRA.2021.3070252"},{"key":"CIT0044","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.1611835114"},{"key":"CIT0045","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2018.8460487"},{"key":"CIT0046","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01234-2_36"}],"container-title":["Advanced Robotics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.tandfonline.com\/doi\/pdf\/10.1080\/01691864.2021.1959397","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,11,6]],"date-time":"2023-11-06T18:53:46Z","timestamp":1699296826000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.tandfonline.com\/doi\/full\/10.1080\/01691864.2021.1959397"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,7,31]]},"references-count":46,"journal-issue":{"issue":"16","published-print":{"date-parts":[[2021,8,18]]}},"alternative-id":["10.1080\/01691864.2021.1959397"],"URL":"https:\/\/doi.org\/10.1080\/01691864.2021.1959397","relation":{},"ISSN":["0169-1864","1568-5535"],"issn-type":[{"type":"print","value":"0169-1864"},{"type":"electronic","value":"1568-5535"}],"subject":[],"published":{"date-parts":[[2021,7,31]]},"assertion":[{"value":"The publishing and review policy for this title is described in its Aims & Scope.","order":1,"name":"peerreview_statement","label":"Peer Review Statement"},{"value":"http:\/\/www.tandfonline.com\/action\/journalInformation?show=aimsScope&journalCode=tadr20","URL":"http:\/\/www.tandfonline.com\/action\/journalInformation?show=aimsScope&journalCode=tadr20","order":2,"name":"aims_and_scope_url","label":"Aim & Scope"},{"value":"2021-04-06","order":0,"name":"received","label":"Received","group":{"name":"publication_history","label":"Publication History"}},{"value":"2021-07-12","order":2,"name":"accepted","label":"Accepted","group":{"name":"publication_history","label":"Publication History"}},{"value":"2021-07-31","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}