% Conference paper in Advances in Neural Information Processing Systems, volume 33 (2020).
% Braces around MDPs keep the acronym capitalised under styles that sentence-case titles.
% Editor given names are stored as initials, as supplied by the source record.
@inproceedings{NEURIPS2020_d3b1fb02,
  author    = {Xu, Ziping and Tewari, Ambuj},
  title     = {Reinforcement Learning in Factored {MDPs}: Oracle-Efficient Algorithms and Tighter Regret Bounds for the Non-Episodic Setting},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Larochelle, H. and Ranzato, M. and Hadsell, R. and Balcan, M. F. and Lin, H.},
  volume    = {33},
  pages     = {18226--18236},
  publisher = {Curran Associates, Inc.},
  year      = {2020},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2020/file/d3b1fb02964aa64e257f9f26a31f72cf-Paper.pdf},
}