Joseph and Bhatnagar. "An Incremental Off-Policy Search in a Model-Free Markov Decision Process Using a Single Sample Path." Machine Learning, 2018. doi:10.1007/S10994-018-5697-1
Markdown
[Joseph and Bhatnagar. "An Incremental Off-Policy Search in a Model-Free Markov Decision Process Using a Single Sample Path." Machine Learning, 2018.](https://mlanthology.org/mlj/2018/joseph2018mlj-incremental/) doi:10.1007/S10994-018-5697-1
BibTeX
% Journal article. Only the proper noun "Markov" is brace-protected in the
% title, so bibliography styles may apply their own casing to the rest.
% The page range uses "--" so that it is typeset as an en dash.
@article{joseph2018mlj-incremental,
  author  = {Joseph, Ajin George and Bhatnagar, Shalabh},
  title   = {An Incremental Off-Policy Search in a Model-Free {Markov} Decision Process Using a Single Sample Path},
  journal = {Machine Learning},
  year    = {2018},
  volume  = {107},
  pages   = {969--1011},
  doi     = {10.1007/S10994-018-5697-1},
  url     = {https://mlanthology.org/mlj/2018/joseph2018mlj-incremental/},
}