% NeurIPS 2019 (volume 32) conference paper by Qian, Fruit, Pirotta, and Lazaric.
% The page range is intentionally omitted: the exported record carried an empty
% pages field; add it here once the actual range is known.
@inproceedings{NEURIPS2019_de594ef5,
  author    = {Qian, Jian and Fruit, Ronan and Pirotta, Matteo and Lazaric, Alessandro},
  title     = {Exploration Bonus for Regret Minimization in Discrete and Continuous Average Reward {MDPs}},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Wallach, H. and Larochelle, H. and Beygelzimer, A. and d'Alch{\'e}-Buc, F. and Fox, E. and Garnett, R.},
  volume    = {32},
  publisher = {Curran Associates, Inc.},
  year      = {2019},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2019/file/de594ef5c314372edec29b93cab9d72e-Paper.pdf},
}