% Chapter in the "Machine Learning: ECML 2007" proceedings volume.
% For @incollection the containing volume goes in `booktitle` (not `journal`),
% and `publisher` is a required field.
@incollection{wierstraPGC,
  author    = {Wierstra, Daan and Schmidhuber, J{\"u}rgen},
  title     = {Policy Gradient Critics},
  booktitle = {Machine Learning: {ECML} 2007},
  series    = {Lecture Notes in Computer Science},
  volume    = {4701},
  pages     = {466--477},
  publisher = {Springer},
  year      = {2007},
  doi       = {10.1007/978-3-540-74958-5_43},
  url       = {http://dx.doi.org/10.1007/978-3-540-74958-5\_43},
  id        = {2361554},
  biburl    = {http://www.bibsonomy.org/bibtex/2fbb02eabf0d2dfcceb4cae9d05017e36/idsia},
  keywords  = {actor-critic, action\_selection, policy\_gradient},
}