% Conference paper in the proceedings of the 46th IEEE Conference on Decision
% and Control (2007). The proper noun "Markov" and the acronyms IEEE/CDC are
% brace-protected so that styles which sentence-case titles keep their capitals.
% NOTE(review): address holds a country rather than the publisher's city;
% confirm the city and replace the value.
@inproceedings{094857bdfe7b497f9f1a81ab07c59bf4,
title = "Optimal control of distributed {Markov} decision processes with network delays",
abstract = "We consider the problem of finding an optimal feedback controller for a network of interconnected subsystems, each of which is a Markov decision process. Each subsystem is coupled to its neighbors via communication links by which signals are delayed but are otherwise transmitted noise-free. One of the subsystems receives input from a controller, and the controller receives delayed state measurements from all of the subsystems. We show that an optimal controller requires only a finite amount of memory which does not grow with time, and obtain a bound on the amount of memory that a controller needs to have for each subsystem. This makes the computation of an optimal controller through dynamic programming tractable. We illustrate our result by a numerical example, and show that it generalizes previous results on Markov decision processes with delayed state measurements.",
author = "Sachin Adlakha and Ritesh Madan and Sanjay Lall and Andrea Goldsmith",
year = "2007",
doi = "10.1109/CDC.2007.4434792",
language = "English (US)",
isbn = "1424414989",
series = "Proceedings of the {IEEE} Conference on Decision and Control",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "3308--3314",
booktitle = "Proceedings of the 46th {IEEE} Conference on Decision and Control 2007, {CDC}",
address = "United States",
note = "46th IEEE Conference on Decision and Control 2007, CDC ; Conference date: 12-12-2007 Through 14-12-2007",
}