Zhang et al. "UNEX-RL: Reinforcing Long-Term Rewards in Multi-Stage Recommender Systems with UNidirectional EXecution." AAAI Conference on Artificial Intelligence, 2024. doi:10.1609/AAAI.V38I8.28783
Markdown
[Zhang et al. "UNEX-RL: Reinforcing Long-Term Rewards in Multi-Stage Recommender Systems with UNidirectional EXecution." AAAI Conference on Artificial Intelligence, 2024.](https://mlanthology.org/aaai/2024/zhang2024aaai-unex/) doi:10.1609/AAAI.V38I8.28783
BibTeX
@inproceedings{zhang2024aaai-unex,
  title     = {{UNEX-RL}: Reinforcing Long-Term Rewards in Multi-Stage Recommender Systems with {UNidirectional} {EXecution}},
  author    = {Zhang, Gengrui and Wang, Yao and Chen, Xiaoshuang and Qian, Hongyi and Zhan, Kaiqiao and Wang, Ben},
  booktitle = {AAAI Conference on Artificial Intelligence},
  year      = {2024},
  pages     = {9305--9313},
  doi       = {10.1609/AAAI.V38I8.28783},
  url       = {https://mlanthology.org/aaai/2024/zhang2024aaai-unex/},
}