Keywords: stochastic games; Nash equilibrium; Markov decision processes; total rewards
@article{10_14736_kyb_2019_1_0152,
author = {Gonz\'alez-Padilla, Francisco J. and Montes-de-Oca, Ra\'ul},
title = {Nash {{\Large} $\epsilon $}-equilibria for stochastic games with total reward functions: an approach through {Markov} decision processes},
journal = {Kybernetika},
pages = {152--165},
year = {2019},
volume = {55},
number = {1},
doi = {10.14736/kyb-2019-1-0152},
mrnumber = {3935419},
zbl = {07088883},
language = {en},
url = {http://geodesic.mathdoc.fr/articles/10.14736/kyb-2019-1-0152/}
}
TY - JOUR
AU - González-Padilla, Francisco J.
AU - Montes-de-Oca, Raúl
TI - Nash {\Large $\epsilon $}-equilibria for stochastic games with total reward functions: an approach through Markov decision processes
JO - Kybernetika
PY - 2019
SP - 152
EP - 165
VL - 55
IS - 1
UR - http://geodesic.mathdoc.fr/articles/10.14736/kyb-2019-1-0152/
DO - 10.14736/kyb-2019-1-0152
LA - en
ID - 10_14736_kyb_2019_1_0152
ER -
%0 Journal Article
%A González-Padilla, Francisco J.
%A Montes-de-Oca, Raúl
%T Nash {\Large $\epsilon $}-equilibria for stochastic games with total reward functions: an approach through Markov decision processes
%J Kybernetika
%D 2019
%P 152-165
%V 55
%N 1
%U http://geodesic.mathdoc.fr/articles/10.14736/kyb-2019-1-0152/
%R 10.14736/kyb-2019-1-0152
%G en
%F 10_14736_kyb_2019_1_0152
González-Padilla, Francisco J.; Montes-de-Oca, Raúl. Nash {\Large $\epsilon $}-equilibria for stochastic games with total reward functions: an approach through Markov decision processes. Kybernetika, Tome 55 (2019) no. 1, pp. 152-165. doi: 10.14736/kyb-2019-1-0152
[1] Aliprantis, C. D., Border, K. C.: Infinite Dimensional Analysis. Springer 2006. | MR | Zbl
[2] Ash, R. B.: Real Analysis and Probability. Academic Press, New York 1972. | MR
[3] Bartle, R.: The Elements of Real Analysis. John Wiley and Sons, Inc. 1964. | DOI | MR
[4] Cavazos-Cadena, R., Montes-de-Oca, R.: Optimal and nearly optimal policies in Markov decision chains with nonnegative rewards and risk-sensitive expected total-reward criterion. In: Markov Processes and Controlled Markov Chains 2002 (Z. Hou, J. A. Filar and A. Chen, eds.), Kluwer Academic Publishers, pp. 189-221. | DOI | MR
[5] Filar, J., Vrieze, K.: Competitive Markov Decision Processes. Springer-Verlag, New York 1997. | MR
[6] Habil, E. D.: Double sequences and double series. The Islamic Univ. J., Series of Natural Studies and Engineering 14 (2006), 1-32. (This reference is available at the Islamic University Journal's site: http://journal.iugaza.edu.ps/index.php/IUGNS/article/view/1594/1525.)
[7] Hernández-Lerma, O., Lasserre, J. B.: Discrete-Time Markov Control Processes: Basic Optimality Criteria. Springer-Verlag, New York 1996. | DOI | MR | Zbl
[8] Hordijk, A.: Dynamic Programming and Markov Potential Theory. Mathematical Centre Tracts 51, Amsterdam 1974. | MR
[9] Jaśkiewicz, A., Nowak, A. S.: Stochastic games with unbounded payoffs: Applications to robust control in Economics. Dyn. Games Appl. 1 (2011), 2, 253-279. | DOI | MR
[10] Kakutani, S.: A generalization of Brouwer's fixed point theorem. Duke Math. J. 8 (1942), 457-459. | DOI | MR
[11] Kelley, J. L.: General Topology. Springer, New York 1955. | MR
[12] Köthe, G.: Topological Vector Spaces I. Springer-Verlag, 1969. | MR
[13] Puterman, M.: Markov Decision Processes. John Wiley and Sons, Inc. New Jersey 1994. | MR | Zbl
[14] Shapley, L. S.: Stochastic games. Proc. Nat. Acad. Sci. U. S. A. 39 (1953), 1095-1100. | DOI | MR | Zbl
[15] Thuijsman, F.: Optimality and Equilibria in Stochastic Games. CW1 Tract-82, Amsterdam 1992. | MR
[16] Zeidler, E.: Nonlinear Functional Analysis and its Applications. Springer-Verlag, New York Inc. 1988. | MR
Cité par Sources :