Bartlett and Baxter. "Estimation and Approximation Bounds for Gradient-Based Reinforcement Learning." Annual Conference on Computational Learning Theory, 2000. doi:10.1006/jcss.2001.1793
Markdown
[Bartlett and Baxter. "Estimation and Approximation Bounds for Gradient-Based Reinforcement Learning." Annual Conference on Computational Learning Theory, 2000.](https://mlanthology.org/colt/2000/bartlett2000colt-estimation/) doi:10.1006/jcss.2001.1793
BibTeX
@inproceedings{bartlett2000colt-estimation,
  title     = {Estimation and Approximation Bounds for Gradient-Based Reinforcement Learning},
  author    = {Bartlett, Peter L. and Baxter, Jonathan},
  booktitle = {Annual Conference on Computational Learning Theory},
  year      = {2000},
  pages     = {133--141},
  doi       = {10.1006/jcss.2001.1793},
  url       = {https://mlanthology.org/colt/2000/bartlett2000colt-estimation/},
}