% Conference paper by Gaudet and Furfaro, presented at the AIAA/AAS
% Astrodynamics Specialist Conference 2012 (13--16 August 2012).
% The citation key is kept unchanged so existing citations continue to resolve.
% The conference name is stored once, in booktitle; the former series field was
% a verbatim copy of booktitle and has been dropped so styles do not print it twice.
@inproceedings{5a7cf6b785ee427aa28514814d4834a5,
  author    = {Gaudet, Brian and Furfaro, Roberto},
  title     = {Robust spacecraft hovering near small bodies in environments with unknown dynamics using reinforcement learning},
  booktitle = {{AIAA/AAS} Astrodynamics Specialist Conference 2012},
  year      = {2012},
  month     = aug,
  doi       = {10.2514/6.2012-5072},
  isbn      = {9781624101823},
  language  = {English (US)},
  note      = {Conference date: 13--16 August 2012},
  abstract  = {Autonomous close proximity operations (including hovering and landing) in the low-gravity environment exhibited by asteroids are particularly challenging. Current approaches to this problem require knowledge of the environmental dynamics in the asteroid's vicinity. This knowledge is costly, both in terms of time and money, to acquire. This paper uses reinforcement learning (RL) to develop a novel non-linear hovering controller with sufficient robustness to allow precision hovering in unknown environments, limited only by the maximum thrust requirements imposed by the environment. We demonstrate the robustness of the controller by simulating precision hovering in multiple environments that were unknown during the policy optimization. The environments are modeled using non-uniform rotation and a non-uniform gravity field. Simulations were also run using a shape model of the asteroid Itokawa. Performance is compared to that of an RL derived optimal linear PD controller and an LQR controller. Since the hovering controller requires an estimate of the spacecraft's state relative to a landmark on the asteroid's surface, we also introduce an optical seeker based navigation approach that accurately estimates the spacecraft's current state using only a single camera and laser range finder.},
}