Anagnostides et al. "Optimistic Policy Gradient in Multi-Player Markov Games with a Single Controller: Convergence Beyond the Minty Property." AAAI Conference on Artificial Intelligence, 2024. doi:10.1609/AAAI.V38I9.28799
Markdown
[Anagnostides et al. "Optimistic Policy Gradient in Multi-Player Markov Games with a Single Controller: Convergence Beyond the Minty Property." AAAI Conference on Artificial Intelligence, 2024.](https://mlanthology.org/aaai/2024/anagnostides2024aaai-optimistic/) doi:10.1609/AAAI.V38I9.28799
BibTeX
% AAAI 2024 conference paper. Only the proper nouns in the title are braced so
% that bibliography styles remain free to apply their own title casing.
@inproceedings{anagnostides2024aaai-optimistic,
  title     = {Optimistic Policy Gradient in Multi-Player {Markov} Games with a Single Controller: Convergence Beyond the {Minty} Property},
  author    = {Anagnostides, Ioannis and Panageas, Ioannis and Farina, Gabriele and Sandholm, Tuomas},
  booktitle = {AAAI Conference on Artificial Intelligence},
  year      = {2024},
  pages     = {9451--9459},
  doi       = {10.1609/AAAI.V38I9.28799},
  url       = {https://mlanthology.org/aaai/2024/anagnostides2024aaai-optimistic/}
}