Perkins. "Reinforcement Learning for POMDPs Based on Action Values and Stochastic Optimization." AAAI Conference on Artificial Intelligence, 2002.
Markdown
[Perkins. "Reinforcement Learning for POMDPs Based on Action Values and Stochastic Optimization." AAAI Conference on Artificial Intelligence, 2002.](https://mlanthology.org/aaai/2002/perkins2002aaai-reinforcement/)
BibTeX
@comment{Conference paper (AAAI 2002). Only the acronym POMDPs is brace-protected in the title so bibliography styles remain free to apply their own casing; the page range uses the BibTeX en-dash form.}
@inproceedings{perkins2002aaai-reinforcement,
  title     = {Reinforcement Learning for {POMDPs} Based on Action Values and Stochastic Optimization},
  author    = {Perkins, Theodore J.},
  booktitle = {AAAI Conference on Artificial Intelligence},
  year      = {2002},
  pages     = {199--204},
  url       = {https://mlanthology.org/aaai/2002/perkins2002aaai-reinforcement/},
}