{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,13]],"date-time":"2026-06-13T16:03:00Z","timestamp":1781366580269,"version":"3.54.1"},"reference-count":31,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,2,22]],"date-time":"2024-02-22T00:00:00Z","timestamp":1708560000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,2,22]],"date-time":"2024-02-22T00:00:00Z","timestamp":1708560000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,2,22]]},"DOI":"10.1109\/icara60736.2024.10553186","type":"proceedings-article","created":{"date-parts":[[2024,6,18]],"date-time":"2024-06-18T13:29:21Z","timestamp":1718717361000},"page":"285-293","source":"Crossref","is-referenced-by-count":1,"title":["Applying Reinforcement Learning to PID Flight Control of a Quadrotor Drone to Mitigate Wind Disturbances"],"prefix":"10.1109","author":[{"given":"Ryan J.","family":"Hoover","sequence":"first","affiliation":[{"name":"Point Park University,Department of Natural Sciecnes and Engineering,Pittsburgh,PA,USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Wenyu","family":"Wu","sequence":"additional","affiliation":[{"name":"Carnegie Mellon University,Department of Mechanical Engineering,Pittsburgh,PA,USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Kenji","family":"Shimada","sequence":"additional","affiliation":[{"name":"Carnegie Mellon University,Department of Mechanical Engineering,Pittsburgh,PA,USA"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-77939-9_2"},{"key":"ref2","volume-title":"Crazyflie 2.1. Bitcraze","year":"2022"},{"key":"ref3","volume-title":"Crazyflie Firmware. Bitcraze","year":"2022"},{"key":"ref4","volume-title":"PX4 Controller Diagrams","year":"2022"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.3390\/electronics10090999"},{"key":"ref6","article-title":"Proximal policy optimization algorithms","author":"John","year":"2017","journal-title":"arXiv preprint"},{"key":"ref7","first-page":"1889","article-title":"Trust region policy optimization","volume-title":"International conference on machine learning","author":"John"},{"key":"ref8","article-title":"Continuous control with deep reinforcement learning","author":"Lillicrap","year":"2015","journal-title":"arXiv preprint"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1145\/3301273"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-77939-9_2"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2005.1545025"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2016.7487175"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2017.2720851"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1177\/0142331217713837"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/IBSSC47189.2019.8973068"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.23919\/CCC50068.2020.9188426"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2016.7487170"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/AERO.2012.6187314"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1016\/j.oceaneng.2010.02.013"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/IROS51168.2021.9635857"},{"key":"ref21","volume-title":"Pybullet, a python module for physics simulation for games, robotics and machine learning","author":"Coumans","year":"2016"},{"key":"ref22","article-title":"Design of a trajectory tracking controller for a nanoquadcopter","author":"Luis","year":"2016","journal-title":"arXiv preprint"},{"key":"ref23","volume-title":"System identification of the crazyflie 2.0 nano quadrocopter","author":"F\u00f6rster","year":"2015"},{"key":"ref24","volume-title":"Planning and control for quadrotor flight through cluttered environments","author":"Landry","year":"2015"},{"key":"ref25","volume-title":"Stable baselines3","author":"Raffin","year":"2021"},{"key":"ref26","article-title":"Flightmare: A flexible quadrotor simulator","author":"Song","year":"2020","journal-title":"arXiv preprint"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-67361-5_40"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-20190-6_4"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1145\/3466618"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/IROS40897.2019.8967695"},{"key":"ref31","first-page":"1861","article-title":"Soft actor-critic: Off-policy maximum entropy deep reinforcement learning with a stochastic actor","volume-title":"International conference on machine learning","author":"Haarnoja"}],"event":{"name":"2024 10th International Conference on Automation, Robotics and Applications (ICARA)","location":"Athens, Greece","start":{"date-parts":[[2024,2,22]]},"end":{"date-parts":[[2024,2,24]]}},"container-title":["2024 10th International Conference on Automation, Robotics and Applications (ICARA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10552867\/10552915\/10553186.pdf?arnumber=10553186","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,17]],"date-time":"2025-11-17T18:37:29Z","timestamp":1763404649000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10553186\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,2,22]]},"references-count":31,"URL":"https:\/\/doi.org\/10.1109\/icara60736.2024.10553186","relation":{},"subject":[],"published":{"date-parts":[[2024,2,22]]}}}