% Journal article record: Kybernetika 25 (1989), no. 3, pp. 145--156.
% The citation key is the same item identifier that ends the url field.
% mrnumber / zbl: presumably MathSciNet and zbMATH review numbers -- confirm.
@article{KYB_1989_25_3_a0,
  author   = {Cavazos-Cadena, Rolando},
  title    = {Weak conditions for the existence of optimal stationary policies in average {Markov} decision chains with unbounded costs},
  journal  = {Kybernetika},
  year     = {1989},
  volume   = {25},
  number   = {3},
  pages    = {145--156},
  language = {en},
  mrnumber = {1010178},
  zbl      = {0673.90092},
  url      = {http://geodesic.mathdoc.fr/item/KYB_1989_25_3_a0/},
}
TY  - JOUR
AU  - Cavazos-Cadena, Rolando
TI  - Weak conditions for the existence of optimal stationary policies in average Markov decision chains with unbounded costs
JO  - Kybernetika
PY  - 1989
SP  - 145
EP  - 156
VL  - 25
IS  - 3
UR  - http://geodesic.mathdoc.fr/item/KYB_1989_25_3_a0/
LA  - en
ID  - KYB_1989_25_3_a0
ER  -
Cavazos-Cadena, Rolando. Weak conditions for the existence of optimal stationary policies in average Markov decision chains with unbounded costs. Kybernetika, Tome 25 (1989) no. 3, pp. 145-156. http://geodesic.mathdoc.fr/item/KYB_1989_25_3_a0/
[1] A. Hordijk: Dynamic Programming and Potential Theory. (Mathematical Centre Tract 51.) Mathematisch Centrum, Amsterdam 1974. | MR
[2] D. P. Heyman, M. J. Sobel: Stochastic Models in Operations Research, Vol. II. McGraw-Hill, New York 1984. | Zbl
[3] J. Dugundji: Topology. Allyn and Bacon, Boston 1966. | MR | Zbl
[4] L. C. Thomas: Connectedness conditions for denumerable state Markov decision processes. In: Recent Developments in Markov Decision Processes (Hartley, Thomas, White, eds.), Academic Press, New York 1981, pp. 181-204.
[5] L. I. Sennott: A new condition for the existence of optimal stationary policies in average cost Markov decision processes. Oper. Res. Lett. 5 (1986), 17-23. | MR | Zbl
[6] L. I. Sennott: A new condition for the existence of optimum stationary policies in average cost Markov decision processes -- unbounded cost case. Proceedings of the 25th IEEE Conf. on Dec. and Control, Athens, Greece 1986, pp. 1719-1721.
[7] L. I. Sennott: Average cost optimal stationary policies in infinite state Markov decision processes -- Existence and an algorithm. Submitted (1987).
[8] M. Loève: Probability Theory I. Springer-Verlag, New York--Berlin--Heidelberg 1977. | MR
[9] P. Nain, K. W. Ross: Optimal priority assignment with hard constraints. Submitted to IEEE Trans. Automat. Control (1986). | MR
[10] R. Cavazos-Cadena: Necessary conditions for the optimality equation in average-reward Markov decision processes. Appl. Math. Optim. 19 (1989), 1, 97-112. | MR | Zbl
[11] R. Cavazos-Cadena: Necessary and sufficient conditions for a bounded solution to the optimality equation in average reward Markov decision chains. Systems Control Lett. 10 (1988), 71-78. | MR | Zbl
[12] R. B. Ash: Real Analysis and Probability. Academic Press, New York 1972. | MR
[13] S. M. Ross: Applied Probability Models with Optimization Applications. Holden-Day, San Francisco 1970. | MR | Zbl
[14] S. M. Ross: Introduction to Stochastic Dynamic Programming. Academic Press, New York 1983. | MR | Zbl