@inbook{42c144a8577649599ef0b2c675564e45,
title = "Markov decision processes",
abstract = "We provide a formal description of the discounted reward MDP framework in Chap. 1, including both the finite- and the infinite-horizon settings and summarizing the associated optimality equations. We then present the well-known exact solution algorithms, value iteration and policy iteration, and outline a framework of rolling-horizon control (also called receding-horizon control) as an approximate solution methodology for solving MDPs, in conjunction with simulation-based approaches covered later in the book. We conclude with a brief survey of other recently proposed MDP solution techniques designed to break the curse of dimensionality.",
keywords = "Convolution, Entropy, Prefix",
author = "Chang, \{Hyeong Soo\} and Jiaqiao Hu and Fu, \{Michael C.\} and Marcus, \{Steven I.\}",
note = "Publisher Copyright: {\textcopyright} Springer-Verlag London 2013.",
year = "2013",
doi = "10.1007/978-1-4471-5022-0\_1",
language = "English",
series = "Communications and Control Engineering",
publisher = "Springer International Publishing",
number = "9781447150213",
pages = "1--17",
booktitle = "Communications and Control Engineering",
edition = "9781447150213",
}