Pivazyan and Shoham. "Polynomial-Time Reinforcement Learning of Near-Optimal Policies." AAAI Conference on Artificial Intelligence, 2002.
Markdown
[Pivazyan and Shoham. "Polynomial-Time Reinforcement Learning of Near-Optimal Policies." AAAI Conference on Artificial Intelligence, 2002.](https://mlanthology.org/aaai/2002/pivazyan2002aaai-polynomial/)
BibTeX
@inproceedings{pivazyan2002aaai-polynomial,
  title     = {Polynomial-Time Reinforcement Learning of Near-Optimal Policies},
  author    = {Pivazyan, Kar{\`e}n and Shoham, Yoav},
  booktitle = {AAAI Conference on Artificial Intelligence},
  year      = {2002},
  pages     = {205--210},
  url       = {https://mlanthology.org/aaai/2002/pivazyan2002aaai-polynomial/},
}