Pietquin et al. "Sample Efficient On-Line Learning of Optimal Dialogue Policies with Kalman Temporal Differences." International Joint Conference on Artificial Intelligence, 2011. doi:10.5591/978-1-57735-516-8/IJCAI11-314
Markdown
[Pietquin et al. "Sample Efficient On-Line Learning of Optimal Dialogue Policies with Kalman Temporal Differences." International Joint Conference on Artificial Intelligence, 2011.](https://mlanthology.org/ijcai/2011/pietquin2011ijcai-sample/) doi:10.5591/978-1-57735-516-8/IJCAI11-314
BibTeX
% Conference paper (International Joint Conference on Artificial Intelligence, 2011).
% Only the proper noun in the title is brace-protected, so the bibliography
% style remains free to apply its own title casing.
@inproceedings{pietquin2011ijcai-sample,
  title     = {Sample Efficient On-Line Learning of Optimal Dialogue Policies with {Kalman} Temporal Differences},
  author    = {Pietquin, Olivier and Geist, Matthieu and Chandramohan, Senthilkumar},
  booktitle = {International Joint Conference on Artificial Intelligence},
  year      = {2011},
  pages     = {1878--1883},
  doi       = {10.5591/978-1-57735-516-8/IJCAI11-314},
  url       = {https://mlanthology.org/ijcai/2011/pietquin2011ijcai-sample/}
}