% "How to Learn a Useful Critic?" -- paper in Advances in Neural Information
% Processing Systems, volume 33 (2020), pages 313--324.
% Notes for maintainers:
%   * The apostrophe in the first author's surname is typed literally so the
%     surname stays a single token for BibTeX name parsing.
%   * Accents are written as brace groups ({\'s}) so BibTeX treats them as one
%     letter when sorting and building labels.
%   * {Model-based} is braced because it starts the subtitle after the question
%     mark and must keep its capital under sentence-casing styles.
@inproceedings{NEURIPS2020_03255088,
  author    = {D'Oro, Pierluca and Ja{\'s}kowski, Wojciech},
  title     = {How to Learn a Useful Critic? {Model-based} Action-Gradient-Estimator Policy Optimization},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Larochelle, H. and Ranzato, M. and Hadsell, R. and Balcan, M. F. and Lin, H.},
  volume    = {33},
  pages     = {313--324},
  publisher = {Curran Associates, Inc.},
  year      = {2020},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2020/file/03255088ed63354a54e0e5ed957e9008-Paper.pdf},
}