Junior et al. "Policy Control with Delayed, Aggregate, and Anonymous Feedback." European Conference on Machine Learning and Principles and Practice of Knowledge Discovery in Databases, 2024. doi:10.1007/978-3-031-70365-2_23
Markdown
[Junior et al. "Policy Control with Delayed, Aggregate, and Anonymous Feedback." European Conference on Machine Learning and Principles and Practice of Knowledge Discovery in Databases, 2024.](https://mlanthology.org/ecmlpkdd/2024/junior2024ecmlpkdd-policy/) doi:10.1007/978-3-031-70365-2_23
BibTeX
@inproceedings{junior2024ecmlpkdd-policy,
  title     = {Policy Control with Delayed, Aggregate, and Anonymous Feedback},
  author    = {Junior, Guilherme Dinis and Magnússon, Sindri and Hollmén, Jaakko},
  booktitle = {European Conference on Machine Learning and Principles and Practice of Knowledge Discovery in Databases},
  year      = {2024},
  pages     = {389--406},
  doi       = {10.1007/978-3-031-70365-2_23},
  url       = {https://mlanthology.org/ecmlpkdd/2024/junior2024ecmlpkdd-policy/}
}