Constrained Control of Large Graph-based MDPs Under Measurement Uncertainty
% Journal article: Haksar and Schwager, IEEE Transactions on Automatic Control, 2023.
% NOTE(review): the original export listed three ISSNs in one field
%   (0018-9286, 1558-2523, 2334-3303). Only the first is kept in the issn field,
%   since that field holds a single identifier; presumably the others are the
%   electronic/alternate-media ISSNs of the same journal. TODO confirm.
% NOTE(review): volume, number and doi are absent, and the page range 1--16
%   looks like an early-access placeholder. TODO confirm against the publisher
%   record and fill in the final values.
@article{haksar_constrained_2023,
  author   = {Haksar, Ravi N. and Schwager, Mac},
  title    = {Constrained Control of Large Graph-based {MDPs} Under Measurement Uncertainty},
  journal  = {IEEE Transactions on Automatic Control},
  year     = {2023},
  pages    = {1--16},
  issn     = {0018-9286},
  url      = {https://ieeexplore.ieee.org/document/10037206/},
  urldate  = {2023-08-29},
  language = {en},
  abstract = {We consider controlling a graph-based Markov decision process (GMDP) with a control capacity constraint given only uncertain measurements of the underlying state. We also consider two special structural properties of GMDPs, called Anonymous Influence and Symmetry. Large-scale spatial processes such as forest wildfires, disease epidemics, opinion dynamics, and robot swarms are well-modeled by GMDPs with these properties. We adopt a certainty-equivalence approach and derive efficient and scalable algorithms for estimating the GMDP state given uncertain measurements, and for computing approximately optimal control policies given a maximum-likelihood state estimate. We also derive sub-optimality bounds for our estimation and control algorithms. Unlike prior work, our methods scale to GMDPs with large state-spaces and explicitly enforce a control constraint. We demonstrate the effectiveness of our estimation and control approach in simulations of controlling a forest wildfire using a model with 101192 total states.},
}