A Blackwell $\epsilon$-optimal strategy in a Markov Decision Process is a strategy that is $\epsilon$-optimal for every discount factor sufficiently close to 1.
¶ We prove the existence of Blackwell $\epsilon$-optimal strategies in finite Markov Decision Processes with partial observation.
@article{1031689022,
author = {Rosenberg, Dinah and Solan, Eilon and Vieille, Nicolas},
title = {Blackwell optimality in Markov decision processes with partial observation},
journal = {Ann. Statist.},
volume = {30},
number = {1},
year = {2002},
pages = { 1178-1193},
language = {en},
url = {http://dml.mathdoc.fr/item/1031689022}
}
Rosenberg, Dinah; Solan, Eilon; Vieille, Nicolas. Blackwell optimality in Markov decision processes with partial observation. Ann. Statist., Tome 30 (2002) no. 1, pp. 1178-1193. http://gdmltest.u-ga.fr/item/1031689022/