[Mahadevan. "An Average-Reward Reinforcement Learning Algorithm for Computing Bias-Optimal Policies." AAAI Conference on Artificial Intelligence, 1996.](https://mlanthology.org/aaai/1996/mahadevan1996aaai-average/)
% Conference paper (AAAI 1996). Title is stored in Title Case without whole-title
% brace protection so the bibliography style controls casing.
@inproceedings{mahadevan1996aaai-average,
  author    = {Mahadevan, Sridhar},
  title     = {An Average-Reward Reinforcement Learning Algorithm for Computing Bias-Optimal Policies},
  booktitle = {AAAI Conference on Artificial Intelligence},
  year      = {1996},
  pages     = {875--880},
  url       = {https://mlanthology.org/aaai/1996/mahadevan1996aaai-average/},
}