Grudic and Ungar. "Rates of Convergence of Performance Gradient Estimates Using Function Approximation and Bias in Reinforcement Learning." Neural Information Processing Systems, 2001.
Markdown
[Grudic and Ungar. "Rates of Convergence of Performance Gradient Estimates Using Function Approximation and Bias in Reinforcement Learning." Neural Information Processing Systems, 2001.](https://mlanthology.org/neurips/2001/grudic2001neurips-rates/)
BibTeX
% Conference paper by Grudic and Ungar (Neural Information Processing Systems, 2001).
% The title is stored in Title Case without whole-title brace protection so the
% bibliography style decides the casing; the page range uses "--" (en dash).
@inproceedings{grudic2001neurips-rates,
  title     = {Rates of Convergence of Performance Gradient Estimates Using Function Approximation and Bias in Reinforcement Learning},
  author    = {Grudic, Gregory Z. and Ungar, Lyle H.},
  booktitle = {Neural Information Processing Systems},
  year      = {2001},
  pages     = {1515--1522},
  url       = {https://mlanthology.org/neurips/2001/grudic2001neurips-rates/}
}