Tsitsiklis and Van Roy. "On Average Versus Discounted Reward Temporal-Difference Learning." Machine Learning, 2002. doi:10.1023/A:1017980312899
Markdown
[Tsitsiklis and Van Roy. "On Average Versus Discounted Reward Temporal-Difference Learning." Machine Learning, 2002.](https://mlanthology.org/mlj/2002/tsitsiklis2002mlj-average/) doi:10.1023/A:1017980312899
BibTeX
@comment{Journal article. The title is stored in Title Case without
  whole-title brace protection so the bibliography style controls casing;
  the page range uses a double hyphen so it typesets as an en-dash.}
@article{tsitsiklis2002mlj-average,
  author  = {Tsitsiklis, John N. and Van Roy, Benjamin},
  title   = {On Average Versus Discounted Reward Temporal-Difference Learning},
  journal = {Machine Learning},
  volume  = {49},
  pages   = {179--191},
  year    = {2002},
  doi     = {10.1023/A:1017980312899},
  url     = {https://mlanthology.org/mlj/2002/tsitsiklis2002mlj-average/},
}