% Baird (1999), "Reinforcement Learning Through Gradient Descent".
% Imported from BibSonomy/CiteULike; the trailing fields (biburl, description,
% priority, citeulike-article-id, keywords) are bookkeeping metadata that
% standard bibliography styles ignore.
% NOTE(review): the entry type is kept as misc because nothing in this record
% names a venue. If this is a thesis or technical report, switch to the
% phdthesis/techreport type and add school/institution -- TODO confirm.
% NOTE(review): the author's given name is only available as an initial here;
% replace it with the full given name once verified.
@misc{baird99reinforcement,
  author               = {Baird, L.},
  title                = {Reinforcement Learning Through Gradient Descent},
  year                 = {1999},
  url                  = {http://citeseer.ifi.unizh.ch/baird99reinforcement.html},
  biburl               = {http://www.bibsonomy.org/bibtex/2255f2c6da1a8995e57d60a697219992e/schaul},
  description          = {idsia},
  priority             = {2},
  citeulike-article-id = {2374771},
  keywords             = {daanbib},
}