O'Donoghue et al. "Combining Policy Gradient and Q-Learning." International Conference on Learning Representations, 2017.
Markdown
[O'Donoghue et al. "Combining Policy Gradient and Q-Learning." International Conference on Learning Representations, 2017.](https://mlanthology.org/iclr/2017/oaposdonoghue2017iclr-combining/)
BibTeX
@comment{Review note: the DOI 10.1007/978-1-4842-6809-4_8 that was attached to this entry has been removed. Its 978-1-4842 ISBN prefix appears to belong to an Apress/Springer book chapter with the same title, not to the ICLR 2017 conference paper. Re-add a doi field only after confirming an identifier that resolves to the paper itself.}
@inproceedings{oaposdonoghue2017iclr-combining,
  author    = {O'Donoghue, Brendan and Munos, R{\'e}mi and Kavukcuoglu, Koray and Mnih, Volodymyr},
  title     = {Combining Policy Gradient and {Q}-Learning},
  booktitle = {International Conference on Learning Representations},
  year      = {2017},
  url       = {https://mlanthology.org/iclr/2017/oaposdonoghue2017iclr-combining/},
}