% Conference paper in Advances in Neural Information Processing Systems 18 (2005).
% - The author's surname is the compound "Van Roy"; the comma form keeps both
%   words in the last-name part so the entry sorts and labels under "Van Roy".
% - The page range is not recorded here; the field is omitted rather than left
%   empty, since an empty field triggers BibTeX/Biber warnings.
% - {TD(0)} is braced so sentence-casing styles do not lowercase the acronym.
@inproceedings{NIPS2005_f076073b,
  author    = {Van Roy, Benjamin},
  title     = {{TD(0)} Leads to Better Policies than Approximate Value Iteration},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Weiss, Yair and Sch{\"o}lkopf, Bernhard and Platt, John},
  volume    = {18},
  publisher = {MIT Press},
  year      = {2005},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2005/file/f076073b2082f8741a9cd07b789c77a0-Paper.pdf},
}