@comment{baxter2001a: journal article, Journal of Artificial Intelligence Research, vol. 15 (2001). Title hyphenation artifact repaired; author given names are stored as initials only.}
@article{baxter2001a,
  author               = {Baxter, J. and Bartlett, P. and Weaver, L.},
  title                = {Experiments with Infinite-Horizon, Policy-Gradient Estimation},
  journal              = {Journal of Artificial Intelligence Research},
  volume               = {15},
  pages                = {351--381},
  year                 = {2001},
  biburl               = {http://www.bibsonomy.org/bibtex/216c359f9dac14aaf235b617c3fca6c99/schaul},
  description          = {idsia},
  priority             = {2},
  citeulike-article-id = {2374785},
  keywords             = {daanbib, gradients, policy},
}