Mahmood and Sutton. "Off-Policy Learning Based on Weighted Importance Sampling with Linear Computational Complexity." Conference on Uncertainty in Artificial Intelligence, 2015.
Markdown
[Mahmood and Sutton. "Off-Policy Learning Based on Weighted Importance Sampling with Linear Computational Complexity." Conference on Uncertainty in Artificial Intelligence, 2015.](https://mlanthology.org/uai/2015/mahmood2015uai-off/)
BibTeX
@inproceedings{mahmood2015uai-off,
  title     = {Off-Policy Learning Based on Weighted Importance Sampling with Linear Computational Complexity},
  author    = {Mahmood, Ashique Rupam and Sutton, Richard S.},
  booktitle = {Conference on Uncertainty in Artificial Intelligence},
  year      = {2015},
  pages     = {552--561},
  url       = {https://mlanthology.org/uai/2015/mahmood2015uai-off/},
}