{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,5]],"date-time":"2026-05-05T22:10:29Z","timestamp":1778019029545,"version":"3.51.4"},"reference-count":34,"publisher":"IEEE","license":[{"start":{"date-parts":[[2020,11,1]],"date-time":"2020-11-01T00:00:00Z","timestamp":1604188800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,11,1]],"date-time":"2020-11-01T00:00:00Z","timestamp":1604188800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,11,1]],"date-time":"2020-11-01T00:00:00Z","timestamp":1604188800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,11]]},"DOI":"10.1109\/biorob49111.2020.9224421","type":"proceedings-article","created":{"date-parts":[[2020,10,15]],"date-time":"2020-10-15T20:05:32Z","timestamp":1602792332000},"page":"878-884","source":"Crossref","is-referenced-by-count":12,"title":["Toward Synergic Learning for Autonomous Manipulation of Deformable Tissues via Surgical Robots: An Approximate Q-Learning Approach"],"prefix":"10.1109","author":[{"given":"Sahba Aghajani","family":"Pedram","sequence":"first","affiliation":[]},{"given":"Peter Walker","family":"Ferguson","sequence":"additional","affiliation":[]},{"given":"Changyeob","family":"Shin","sequence":"additional","affiliation":[]},{"given":"Ankur","family":"Mehta","sequence":"additional","affiliation":[]},{"given":"Erik P.","family":"Dutson","sequence":"additional","affiliation":[]},{"given":"Farshid","family":"Alambeigi","sequence":"additional","affiliation":[]},{"given":"Jacob","family":"Rosen","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref33","volume":"3","author":"hearn","year":"2004","journal-title":"Computer Graphics with OpenGL"},{"key":"ref32","article-title":"Opencv","volume":"3","author":"bradski","year":"2000","journal-title":"Dr Dobb&#x2019;s J Softw Tools"},{"key":"ref31","first-page":"496","article-title":"The chai libraries","author":"conti","year":"2003","journal-title":"Proc of Eurohaptics 2003"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/WACV.2017.58"},{"key":"ref34","first-page":"91","article-title":"Faster r-cnn: Towards real-time object detection with region proposal networks","author":"ren","year":"2015","journal-title":"Advances in neural information processing systems"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2018.2863376"},{"key":"ref11","first-page":"1097","article-title":"Imagenet classification with deep convolutional neural networks","author":"krizhevsky","year":"2012","journal-title":"Advances in neural information processing systems"},{"key":"ref12","first-page":"1334","article-title":"End-to-end training of deep visuomotor policies","volume":"17","author":"levine","year":"2016","journal-title":"The Journal of Machine Learning Research"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1017\/S0263574799002362"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1016\/j.rcim.2011.08.002"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8794159"},{"key":"ref16","article-title":"Scade: Simultaneous sensor calibration and deformation estimation of fbg-equipped unmodeled continuum manipulators","author":"alambeigi","year":"2019","journal-title":"IEEE Transactions on Robotics"},{"key":"ref17","author":"bishop","year":"2006","journal-title":"Pattern Recognition and Machine Learning"},{"key":"ref18","doi-asserted-by":"crossref","DOI":"10.1609\/aaai.v24i1.7727","article-title":"Relative entropy policy search","author":"peters","year":"2010","journal-title":"Twenty-Fourth AAAI Conference on Artificial Intelligence"},{"key":"ref19","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1561\/2300000021","article-title":"A survey on policy search for robotics","volume":"2","author":"deisenroth","year":"2013","journal-title":"Foundations and Trends in Robotics"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICMLC.2010.38"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1126\/scitranslmed.aad9398"},{"key":"ref27","author":"rivlin","year":"2003","journal-title":"An Introduction to the Approximation of Functions"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2016.7487611"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2018.2888896"},{"key":"ref29","article-title":"Playing atari with deep reinforcement learning","author":"mnih","year":"2013","journal-title":"arXiv preprint arXiv 1312 5602"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1007\/s10439-018-2074-y"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1111\/j.1749-4486.2008.01703.x"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2015.7139344"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989278"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TMRB.2019.2895780"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/11566489_12"},{"key":"ref20","first-page":"2829","article-title":"Continuous deep q-learning with model-based acceleration","author":"gu","year":"2016","journal-title":"International Conference on Machine Learning"},{"key":"ref22","author":"watkins","year":"1989","journal-title":"Learning from delayed rewards"},{"key":"ref21","doi-asserted-by":"crossref","first-page":"279","DOI":"10.1007\/BF00992698","article-title":"Q-learning","volume":"8","author":"watkins","year":"1992","journal-title":"Machine Learning"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TRO.2016.2533639"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1177\/0278364913495721"},{"key":"ref26","volume":"135","author":"sutton","year":"1998","journal-title":"Introduction to Reinforcement Learning"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/TBME.2012.2228858"}],"event":{"name":"2020 8th IEEE RAS\/EMBS International Conference for Biomedical Robotics and Biomechatronics (BioRob)","location":"New York City, NY, USA","start":{"date-parts":[[2020,11,29]]},"end":{"date-parts":[[2020,12,1]]}},"container-title":["2020 8th IEEE RAS\/EMBS International Conference for Biomedical Robotics and Biomechatronics (BioRob)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9219774\/9224269\/09224421.pdf?arnumber=9224421","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,11,23]],"date-time":"2022-11-23T13:47:10Z","timestamp":1669211230000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9224421\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,11]]},"references-count":34,"URL":"https:\/\/doi.org\/10.1109\/biorob49111.2020.9224421","relation":{},"subject":[],"published":{"date-parts":[[2020,11]]}}}