@inproceedings{bad94bcaa42c4022b27b3e3d21881c39,
title = "Policy gradient approach for dynamic sensor tasking applied to space situational awareness",
abstract = "This paper studies the sensors tasking and management problem for optical Space Object (SO) tracking. The tasking problem is formulated as Markov Decision Process (MDP) and solved using Reinforcement Learning (RL). This RL problem is solved using actor-critic policy gradient approach. This approach is used to find the optimal policy for tasking optical sensors to estimate SO orbits. The reward function is based reducing the uncertainty for the overall catalog to a given upper bound. The reward is negative as long as a SO exist that is about the desired catalog uncertainty. This work tests this approach in simulation and good performance is found using the actor-critic policy gradient approach.",
author = "Richard Linares and Roberto Furfaro",
year = "2017",
language = "English (US)",
isbn = "9780877036371",
series = "Advances in the Astronautical Sciences",
publisher = "Univelt Inc.",
pages = "1247--1257",
editor = "Sims, {Jon A.} and Leve, {Frederick A.} and McMahon, {Jay W.} and Yanping Guo",
booktitle = "Spaceflight Mechanics 2017",
note = "27th AAS/AIAA Space Flight Mechanics Meeting, 2017 ; Conference date: 05-02-2017 Through 09-02-2017",
}