@comment{NeurIPS 2022 conference paper. Each author is written in Last, First form and the names are joined with the keyword and, which is the only separator BibTeX uses to split a name list into individual people.}
@inproceedings{zihan2022near-optimal,
  author    = {Zhang, Zihan and Jiang, Yuhang and Zhou, Yuan and Ji, Xiangyang},
  title     = {Near-Optimal Regret Bounds for Multi-batch Reinforcement Learning},
  booktitle = {Conference on Neural Information Processing Systems ({NeurIPS})},
  year      = {2022},
  url       = {http://archive.ymsc.tsinghua.edu.cn/pacm_paperurl/20230227163550929080748},
}
Zihan Zhang, Yuhang Jiang, Yuan Zhou, and Xiangyang Ji. Near-Optimal Regret Bounds for Multi-batch Reinforcement Learning. 2022. In Conference on Neural Information Processing Systems (NeurIPS). http://archive.ymsc.tsinghua.edu.cn/pacm_paperurl/20230227163550929080748.