% Baird (1999), "Reinforcement Learning Through Gradient Descent".
% Imported from BibSonomy (user schaul); the fields after `url` are export
% metadata that standard styles ignore.
% NOTE(review): this looks like a PhD thesis -- if confirmed, switch the entry
% type to phdthesis and add the `school` field. The author's given name is
% abbreviated in the export; expand it once verified against the source.
@misc{baird99reinforcement,
  author               = {Baird, L.},
  title                = {Reinforcement Learning Through Gradient Descent},
  year                 = {1999},
  url                  = {http://citeseer.ifi.unizh.ch/baird99reinforcement.html},
  keywords             = {daanbib},
  description          = {idsia},
  priority             = {2},
  added-at             = {2008-02-26T12:05:08.000+0100},
  timestamp            = {2008-02-26T12:05:08.000+0100},
  biburl               = {http://www.bibsonomy.org/bibtex/2255f2c6da1a8995e57d60a697219992e/schaul},
  citeulike-article-id = {2374771},
  interhash            = {24e2732d3fa83438db516730e095430b},
  intrahash            = {255f2c6da1a8995e57d60a697219992e},
}