{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,6]],"date-time":"2026-03-06T19:02:33Z","timestamp":1772823753280,"version":"3.50.1"},"reference-count":42,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2021,1,12]],"date-time":"2021-01-12T00:00:00Z","timestamp":1610409600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,1,12]],"date-time":"2021-01-12T00:00:00Z","timestamp":1610409600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Syst Sci Complex"],"published-print":{"date-parts":[[2021,8]]},"DOI":"10.1007\/s11424-020-9265-y","type":"journal-article","created":{"date-parts":[[2021,1,13]],"date-time":"2021-01-13T03:31:44Z","timestamp":1610508704000},"page":"1401-1425","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":8,"title":["Q-Learning-Based Target Selection for Bearings-Only Autonomous Navigation"],"prefix":"10.1007","volume":"34","author":[{"given":"Kai","family":"Xiong","sequence":"first","affiliation":[]},{"given":"Chunling","family":"Wei","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2021,1,12]]},"reference":[{"key":"9265_CR1","doi-asserted-by":"publisher","first-page":"1381","DOI":"10.1017\/S0373463318000309","volume":"71","author":"S Xin","year":"2018","unstructured":"Xin S, Wang Y, Zheng W, et al., An interplanetary network for spacecraft autonomous navigation, The Journal of Navigation, 2018, 71: 1381\u20131395.","journal-title":"The Journal of Navigation"},{"key":"9265_CR2","first-page":"048001","volume":"4","author":"L Gu","year":"2018","unstructured":"Gu L, Li S, Li W, et al., Comparative study on autonomous navigation for Mars cruise probe based on observability analysis, Journal of Astronomical Telescopes, Instruments, and Systems, 2018, 4: 048001.","journal-title":"Journal of Astronomical Telescopes, Instruments, and Systems"},{"key":"9265_CR3","doi-asserted-by":"publisher","first-page":"1392","DOI":"10.1109\/TAES.2018.2791038","volume":"54","author":"X Ning","year":"2018","unstructured":"Ning X, Gui M, Fang J, et al., A novel autonomous celestial navigation method using solar oscillation time delay measurement, IEEE Transactions on Aerospace and Electronic Systems, 2018, 54: 1392\u20131403.","journal-title":"IEEE Transactions on Aerospace and Electronic Systems"},{"issue":"5","key":"9265_CR4","doi-asserted-by":"publisher","first-page":"1206","DOI":"10.1007\/s11424-018-6096-1","volume":"31","author":"Q Su","year":"2018","unstructured":"Su Q and Huang Y, Observability analysis and navigation algorithm for distributed satellite system using relative range measurements, Journal of Systems Science and Complexity, 2018, 31(5): 1206\u20131226.","journal-title":"Journal of Systems Science and Complexity"},{"key":"9265_CR5","doi-asserted-by":"publisher","first-page":"116","DOI":"10.1016\/j.actaastro.2015.07.027","volume":"117","author":"S G Hesar","year":"2015","unstructured":"Hesar S G, Parker J S, Leonard J M, et al., Lunar far side surface navigation using linked autonomous interplanetary satellite orbit navigation (LiAISON), Acta Astronautica, 2015, 117: 116\u2013129.","journal-title":"Acta Astronautica"},{"key":"9265_CR6","doi-asserted-by":"publisher","first-page":"634","DOI":"10.2514\/1.39499","volume":"33","author":"X Wang","year":"2010","unstructured":"Wang X, Xie J, and Ma S, Starlight atmospheric refraction model for a continuous range of height, Journal of Guidance, Control, and Dynamics, 2010, 33: 634\u2013637.","journal-title":"Journal of Guidance, Control, and Dynamics"},{"key":"9265_CR7","doi-asserted-by":"publisher","first-page":"1489","DOI":"10.1109\/TAES.2017.2671684","volume":"53","author":"X Ning","year":"2017","unstructured":"Ning X, Wang F, and Fang J, An implicit UKF for satellite stellar refraction navigation system, IEEE Transactions on Aerospace and Electronic Systems, 2017, 53: 1489\u20131503.","journal-title":"IEEE Transactions on Aerospace and Electronic Systems"},{"key":"9265_CR8","doi-asserted-by":"publisher","first-page":"192","DOI":"10.2514\/1.G000872","volume":"38","author":"J A Christian","year":"2015","unstructured":"Christian J A, Optical navigation using planet\u2019s centroid and apparent diameter in image, Journal of Guidance, Control, and Dynamics, 2015, 38: 192\u2013204.","journal-title":"Journal of Guidance, Control, and Dynamics"},{"issue":"6","key":"9265_CR9","doi-asserted-by":"publisher","first-page":"1151","DOI":"10.2514\/1.G000575","volume":"38","author":"R R Karimi","year":"2015","unstructured":"Karimi R R and Mortari D, Interplanetary autonomous navigation using visible planets, Journal of Guidance, Control, and Dynamics, 2015, 38(6): 1151\u20131156.","journal-title":"Journal of Guidance, Control, and Dynamics"},{"key":"9265_CR10","doi-asserted-by":"publisher","first-page":"1427","DOI":"10.1017\/S0373463316000424","volume":"69","author":"J Li","year":"2016","unstructured":"Li J, Gao C, Feng T, et al., Error correction of infrared Earth radiance for autonomous navigation, The Journal of Navigation, 2016, 69: 1427\u20131437.","journal-title":"The Journal of Navigation"},{"key":"9265_CR11","doi-asserted-by":"publisher","first-page":"49","DOI":"10.2514\/1.13331","volume":"29","author":"S I Sheikh","year":"2006","unstructured":"Sheikh S I, Pines D J, Wood K S, et al., Spacecraft navigation using X-ray pulsars, Journal of Guidance, Control, and Dynamics, 2006, 29: 49\u201363.","journal-title":"Journal of Guidance, Control, and Dynamics"},{"key":"9265_CR12","doi-asserted-by":"publisher","first-page":"4484","DOI":"10.1109\/TSP.2010.2050479","volume":"58","author":"A A Emadzadeh","year":"2010","unstructured":"Emadzadeh A A and Speyer J L, On modeling and pulse phase estimation of X-ray pulsars, IEEE Transactions on Signal Processing, 2010, 58: 4484\u20134495.","journal-title":"IEEE Transactions on Signal Processing"},{"key":"9265_CR13","doi-asserted-by":"publisher","first-page":"757","DOI":"10.1016\/j.ijleo.2016.10.132","volume":"130","author":"Y Wang","year":"2017","unstructured":"Wang Y, Zheng W, Zhang D, et al., Pulsar profile denosing using kernel regression based on maximum correntropy criterion, Optik, 2017, 130: 757\u2013764.","journal-title":"Optik"},{"key":"9265_CR14","doi-asserted-by":"publisher","first-page":"155","DOI":"10.1017\/S0373463318000632","volume":"72","author":"H Zhang","year":"2019","unstructured":"Zhang H, Jiao R, and Xu L, Orbit determination using pulsar timing data and orientation vector, The Journal of Navigation, 2019, 72: 155\u2013175.","journal-title":"The Journal of Navigation"},{"key":"9265_CR15","doi-asserted-by":"publisher","first-page":"122","DOI":"10.1016\/j.actaastro.2009.12.010","volume":"67","author":"T Chen","year":"2010","unstructured":"Chen T and Xu S, Double line-of-sight measuring relative navigation for spacecraft autonomous rendezvous, Acta Astronautica, 2010, 67: 122\u2013134.","journal-title":"Acta Astronautica"},{"key":"9265_CR16","doi-asserted-by":"publisher","first-page":"1285","DOI":"10.2514\/1.47560","volume":"34","author":"M L Psiaki","year":"2011","unstructured":"Psiaki M L, Absolute oribt and gravity determination using relative position measurements between two satellites, Journal of Guidance, Control, and Dynamics, 2011, 34: 1285\u20131297.","journal-title":"Journal of Guidance, Control, and Dynamics"},{"key":"9265_CR17","doi-asserted-by":"publisher","first-page":"1250","DOI":"10.2514\/1.62476","volume":"37","author":"J Grzymisch","year":"2014","unstructured":"Grzymisch J and Fichter W, Observability criteria and unobservable maneuvers for in-orbit bearing-only navigation, Journal of Guidance, Control, and Dynamics, 2014, 37: 1250\u20131259.","journal-title":"Journal of Guidance, Control, and Dynamics"},{"key":"9265_CR18","doi-asserted-by":"publisher","first-page":"514","DOI":"10.1109\/TAC.2009.2037467","volume":"55","author":"S Kluge","year":"2010","unstructured":"Kluge S, Reif K, and Brokate M, Stochastic stability of the extended Kalman filter with intermittent observations, IEEE Transactions on Automatic Control, 2010, 55: 514\u2013518.","journal-title":"IEEE Transactions on Automatic Control"},{"key":"9265_CR19","first-page":"947","volume":"30","author":"X Zhang","year":"2009","unstructured":"Zhang X, Wang D, and Huang X, Study on the selection of the beacon asteroids in autonomous optical navigation for interplanetary exploration, Journal of Astronautics, 2009, 30: 947\u2013952.","journal-title":"Journal of Astronautics"},{"key":"9265_CR20","doi-asserted-by":"publisher","first-page":"1338","DOI":"10.1109\/TAC.2011.2175070","volume":"57","author":"M F Huber","year":"2012","unstructured":"Huber M F, Optimal pruning for multi-step sensor scheduling, IEEE Transactions on Automatic Control, 2012, 57: 1338\u20131343.","journal-title":"IEEE Transactions on Automatic Control"},{"key":"9265_CR21","doi-asserted-by":"publisher","first-page":"4411","DOI":"10.1109\/TSP.2015.2439239","volume":"63","author":"A Nordio","year":"2015","unstructured":"Nordio A, Tarable A, Dabbene F, et al., Sensor selection and precoding strategies for wireless sensor networks, IEEE Transactions on Signal Processing, 2015, 63: 4411\u20134421.","journal-title":"IEEE Transactions on Signal Processing"},{"key":"9265_CR22","doi-asserted-by":"publisher","first-page":"684","DOI":"10.1109\/TSP.2014.2379662","volume":"63","author":"S Prabhakar","year":"2015","unstructured":"Prabhakar S and Leus G, Sparsity-promoting sensor selection for non-linear measurement models, IEEE Transactions on Signal Processing, 2015, 63: 684\u2013698.","journal-title":"IEEE Transactions on Signal Processing"},{"key":"9265_CR23","doi-asserted-by":"publisher","first-page":"202","DOI":"10.1016\/j.automatica.2016.12.025","volume":"78","author":"H Zhang","year":"2017","unstructured":"Zhang H, Ayoub R, and Sundaram S, Sensor selection for Kalman filtering of linear dynamical systems: Complexity, limitations and greedy algorithms, Automatica, 2017, 78: 202\u2013210.","journal-title":"Automatica"},{"key":"9265_CR24","doi-asserted-by":"publisher","first-page":"1245","DOI":"10.1049\/cje.2017.09.030","volume":"26","author":"J Wang","year":"2017","unstructured":"Wang J, He Z, Zhou H, et al., Optimal weight and parameter estimation of multi-structure and unequal-precision data fusion, Chinese Journal of Electronic, 2017, 26: 1245\u20131253.","journal-title":"Chinese Journal of Electronic"},{"key":"9265_CR25","first-page":"279","volume":"8","author":"C J Watkins","year":"1992","unstructured":"Watkins C J and Dayan P, Q-learning, Machine Learning, 1992, 8: 279\u2013292.","journal-title":"Machine Learning"},{"key":"9265_CR26","doi-asserted-by":"publisher","first-page":"178","DOI":"10.1287\/ijoc.1080.0305","volume":"21","author":"A Gosavi","year":"2009","unstructured":"Gosavi A, Reinforcement learning: A tutorial survey and recent advances, Informs Journal on Computing, 2009, 21: 178\u2013192.","journal-title":"Informs Journal on Computing"},{"key":"9265_CR27","doi-asserted-by":"publisher","first-page":"1238","DOI":"10.1177\/0278364913495721","volume":"32","author":"J Kober","year":"2013","unstructured":"Kober J, Bagnell J A, and Peters J, Reinforcement learning in robotics: A survey, The International Journal of Robotics Research, 2013, 32: 1238\u20131274.","journal-title":"The International Journal of Robotics Research"},{"key":"9265_CR28","doi-asserted-by":"publisher","first-page":"213","DOI":"10.1016\/j.automatica.2018.05.027","volume":"95","author":"S A A Rizvi","year":"2018","unstructured":"Rizvi S A A and Lin Z, Output feedback Q-learning for discrete-time linear zero-sum games with application to the H-infinity control, Automatica, 2018, 95: 213\u2013221.","journal-title":"Automatica"},{"key":"9265_CR29","doi-asserted-by":"publisher","first-page":"1018","DOI":"10.1109\/TAC.2017.2734840","volume":"63","author":"K G Vamvoudakis","year":"2018","unstructured":"Vamvoudakis K G and Hespanha J P, Cooperative Q-learning for rejection of persistent adversarial inputs in networked linear quadratic systems, IEEE Transactions on Automatic Control, 2018, 63: 1018\u20131031.","journal-title":"IEEE Transactions on Automatic Control"},{"key":"9265_CR30","doi-asserted-by":"publisher","first-page":"4953","DOI":"10.1109\/TIE.2017.2772162","volume":"65","author":"B Luo","year":"2018","unstructured":"Luo B, Wu H, and Huang T, Optimal output regulation for model-free quanser helicopter with multistep Q-learning, IEEE Transactions on Industrial Electronics, 2018, 65: 4953\u20134961.","journal-title":"IEEE Transactions on Industrial Electronics"},{"key":"9265_CR31","doi-asserted-by":"publisher","first-page":"1141","DOI":"10.1109\/TSMCA.2012.2227719","volume":"43","author":"A Konar","year":"2013","unstructured":"Konar A, Chakraborty I G, Singh S J, et al., A deterministic improved Q-learning for path planning of a mobile robot, IEEE Transactions on Systems, Man, and Cybernetics: Systems, 2013, 43: 1141\u20131153.","journal-title":"IEEE Transactions on Systems, Man, and Cybernetics: Systems"},{"key":"9265_CR32","doi-asserted-by":"publisher","first-page":"1823","DOI":"10.1109\/TVT.2010.2043124","volume":"59","author":"A Galindo-Serrano","year":"2010","unstructured":"Galindo-Serrano A and Giupponi L, Distributed Q-learning for aggregated interference control in cognitive radio networks, IEEE Transactions on Vehicular Technology, 2010, 59: 1823\u20131834.","journal-title":"IEEE Transactions on Vehicular Technology"},{"key":"9265_CR33","doi-asserted-by":"publisher","first-page":"1224","DOI":"10.1109\/TCYB.2016.2542923","volume":"47","author":"Q Wei","year":"2017","unstructured":"Wei Q, Lewis F L, Sun Q, et al., Discrete-time deterministic Q-learning: A novel convergence analysis, IEEE Transactions on Cybernetics, 2017, 47: 1224\u20131237.","journal-title":"IEEE Transactions on Cybernetics"},{"key":"9265_CR34","doi-asserted-by":"publisher","first-page":"1545","DOI":"10.1109\/TAC.2016.2598476","volume":"62","author":"G Arslan","year":"2017","unstructured":"Arslan G and Yuksel S, Decentralized Q-learning for stochastic teams and games, IEEE Transactions on Automatic Control, 2017, 62: 1545\u20131558.","journal-title":"IEEE Transactions on Automatic Control"},{"key":"9265_CR35","doi-asserted-by":"publisher","first-page":"66","DOI":"10.1016\/j.robot.2017.03.003","volume":"92","author":"A K Sadhu","year":"2017","unstructured":"Sadhu A K and Konar A, Improving the speed of convergence of multi-agent Q-learning for cooperative task-planning by a robot-team, Robotics and Autonomous Systems, 2017, 92: 66\u201380.","journal-title":"Robotics and Autonomous Systems"},{"key":"9265_CR36","doi-asserted-by":"publisher","first-page":"393","DOI":"10.1109\/TSMCC.2010.2055049","volume":"41","author":"H S Ahn","year":"2011","unstructured":"Ahn H S, Jung O, Choi S, et al., An optimal satellite antenna profile using reinforcement learning, IEEE Transactions on System, Man, and Cybernetics \u2014 Part C: Applications and Reviews, 2011, 41: 393\u2013406.","journal-title":"IEEE Transactions on System, Man, and Cybernetics \u2014 Part C: Applications and Reviews"},{"key":"9265_CR37","doi-asserted-by":"publisher","first-page":"247","DOI":"10.1016\/j.procs.2018.10.178","volume":"141","author":"D Kim","year":"2018","unstructured":"Kim D, Lee T, Kim S, et al., Adaptive packet scheduling in IoT environment based on Q-learning, Procedia Computer Science, 2018, 141: 247\u2013254.","journal-title":"Procedia Computer Science"},{"key":"9265_CR38","doi-asserted-by":"publisher","first-page":"1023","DOI":"10.1016\/j.procs.2018.04.248","volume":"131","author":"C Han","year":"2018","unstructured":"Han C, Niu Y, Pang T, et al., Intelligent anti-jamming communication based on the modified Q-learning, Procedia Computer Science, 2018, 131: 1023\u20131031.","journal-title":"Procedia Computer Science"},{"key":"9265_CR39","doi-asserted-by":"publisher","first-page":"137","DOI":"10.1007\/s10994-011-5235-x","volume":"84","author":"R Hafner","year":"2011","unstructured":"Hafner R and Riedmiller M, Reinforcement learning in feedback control, Mach. Learn., 2011, 84: 137\u2013169.","journal-title":"Mach. Learn."},{"key":"9265_CR40","doi-asserted-by":"publisher","first-page":"246","DOI":"10.1016\/j.eswa.2017.11.011","volume":"100","author":"A Martinez-Tenor","year":"2018","unstructured":"Martinez-Tenor A, Antonio J, Fernandez-Madrigal A, et al., Towards a common implementation of reinforcement learning for multiple robotic tasks, Expert Systems with Applications, 2018, 100: 246\u2013259.","journal-title":"Expert Systems with Applications"},{"key":"9265_CR41","doi-asserted-by":"publisher","first-page":"2042","DOI":"10.1109\/TNNLS.2017.2773458","volume":"29","author":"B Kiumarsi","year":"2018","unstructured":"Kiumarsi B, Vamvoudakis K G, Modares H, et al., Optimal and autonomous control using reinforcement learning: A survey, IEEE Transactions on Neural Networks and Learning Systems, 2018, 29: 2042\u20132062.","journal-title":"IEEE Transactions on Neural Networks and Learning Systems"},{"key":"9265_CR42","doi-asserted-by":"publisher","first-page":"587","DOI":"10.1109\/TAES.2002.1008988","volume":"38","author":"C C Liebe","year":"2002","unstructured":"Liebe C C, Accuracy performance of star trackers \u2014 A tutorial, IEEE Transactions on Aerospace and Electronic Systems, 2002, 38: 587\u2013599.","journal-title":"IEEE Transactions on Aerospace and Electronic Systems"}],"container-title":["Journal of Systems Science and Complexity"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11424-020-9265-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11424-020-9265-y\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11424-020-9265-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,8,10]],"date-time":"2021-08-10T10:03:02Z","timestamp":1628589782000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11424-020-9265-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,1,12]]},"references-count":42,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2021,8]]}},"alternative-id":["9265"],"URL":"https:\/\/doi.org\/10.1007\/s11424-020-9265-y","relation":{},"ISSN":["1009-6124","1559-7067"],"issn-type":[{"value":"1009-6124","type":"print"},{"value":"1559-7067","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,1,12]]},"assertion":[{"value":"23 September 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 June 2020","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 January 2021","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}