Low et al. "Sample-Efficient Iterative Lower Bound Optimization of Deep Reactive Policies for Planning in Continuous MDPs." AAAI Conference on Artificial Intelligence, 2022. doi:10.1609/AAAI.V36I9.21220
Markdown
[Low et al. "Sample-Efficient Iterative Lower Bound Optimization of Deep Reactive Policies for Planning in Continuous MDPs." AAAI Conference on Artificial Intelligence, 2022.](https://mlanthology.org/aaai/2022/low2022aaai-sample/) doi:10.1609/AAAI.V36I9.21220
BibTeX
% Conference paper entry. Only the acronym in the title is brace-protected so
% that the bibliography style controls the casing of the remaining words.
@inproceedings{low2022aaai-sample,
  author    = {Low, Siow Meng and Kumar, Akshat and Sanner, Scott},
  title     = {Sample-Efficient Iterative Lower Bound Optimization of Deep Reactive Policies for Planning in Continuous {MDPs}},
  booktitle = {AAAI Conference on Artificial Intelligence},
  year      = {2022},
  pages     = {9840--9848},
  doi       = {10.1609/AAAI.V36I9.21220},
  url       = {https://mlanthology.org/aaai/2022/low2022aaai-sample/},
}