% Conference paper in Advances in Neural Information Processing Systems, volume 33 (2020).
% {Lagrangian} is brace-protected so sentence-casing styles keep its capital.
@inproceedings{NEURIPS2020_488e4104,
  author    = {Yang, Mengjiao and Nachum, Ofir and Dai, Bo and Li, Lihong and Schuurmans, Dale},
  title     = {Off-Policy Evaluation via the Regularized {Lagrangian}},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Larochelle, H. and Ranzato, M. and Hadsell, R. and Balcan, M. F. and Lin, H.},
  volume    = {33},
  pages     = {6551--6561},
  publisher = {Curran Associates, Inc.},
  year      = {2020},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2020/file/488e4104520c6aab692863cc1dba45af-Paper.pdf},
}