% Xie et al., "Hierarchical Reinforcement Learning for Integrated Recommendation",
% Proceedings of the AAAI Conference on Artificial Intelligence 35(5), 2021.
% Notes for maintainers:
%   - `month` uses the predefined three-letter macro (unquoted) so styles can format it.
%   - `pages` uses a double hyphen so the range is typeset as an en-dash.
%   - `abstractNote` is not a standard BibTeX field; standard styles ignore it
%     (presumably left over from a reference-manager export -- kept verbatim).
@article{Xie_Zhang_Wang_Xia_Lin_2021,
  author       = {Xie, Ruobing and Zhang, Shaoliang and Wang, Rui and Xia, Feng and Lin, Leyu},
  title        = {Hierarchical Reinforcement Learning for Integrated Recommendation},
  journal      = {Proceedings of the {AAAI} Conference on Artificial Intelligence},
  volume       = {35},
  number       = {5},
  pages        = {4521--4528},
  year         = {2021},
  month        = may,
  doi          = {10.1609/aaai.v35i5.16580},
  url          = {https://ojs.aaai.org/index.php/AAAI/article/view/16580},
  abstractNote = {Integrated recommendation aims to jointly recommend heterogeneous items in the main feed from different sources via multiple channels, which needs to capture user preferences on both item and channel levels. It has been widely used in practical systems by billions of users, while few works concentrate on the integrated recommendation systematically. In this work, we propose a novel Hierarchical reinforcement learning framework for integrated recommendation (HRL-Rec), which divides the integrated recommendation into two tasks to recommend channels and items sequentially. The low-level agent is a channel selector, which generates a personalized channel list. The high-level agent is an item recommender, which recommends specific items from heterogeneous channels under the channel constraints. We design various rewards for both recommendation accuracy and diversity, and propose four losses for fast and stable model convergence. We also conduct an online exploration for sufficient training. In experiments, we conduct extensive offline and online experiments on a billion-level real-world dataset to show the effectiveness of HRL-Rec. HRL-Rec has also been deployed on WeChat Top Stories, affecting millions of users. The source codes are released in https://github.com/modriczhang/HRL-Rec.},
}