% Conference paper in Advances in Neural Information Processing Systems, volume 33 (2020).
% The acronym in the title is brace-protected so sentence-casing styles keep it uppercase.
@inproceedings{NEURIPS2020_a992995e,
  author    = {Ma, Shaocong and Zhou, Yi and Zou, Shaofeng},
  title     = {Variance-Reduced Off-Policy {TDC} Learning: Non-Asymptotic Convergence Analysis},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Larochelle, H. and Ranzato, M. and Hadsell, R. and Balcan, M. F. and Lin, H.},
  volume    = {33},
  pages     = {14796--14806},
  publisher = {Curran Associates, Inc.},
  year      = {2020},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2020/file/a992995ef4f0439b258f2360dbb85511-Paper.pdf},
}