% Lyu et al., "Mildly Conservative Q-Learning for Offline Reinforcement Learning",
% NeurIPS 2022 (Advances in Neural Information Processing Systems, vol. 35).
% The "Q" in the title is brace-protected so sentence-casing styles keep it uppercase.
@inproceedings{NEURIPS2022_0b5669c3,
  author    = {Lyu, Jiafei and Ma, Xiaoteng and Li, Xiu and Lu, Zongqing},
  title     = {Mildly Conservative {Q}-Learning for Offline Reinforcement Learning},
  booktitle = {Advances in Neural Information Processing Systems},
  editor    = {Koyejo, S. and Mohamed, S. and Agarwal, A. and Belgrave, D. and Cho, K. and Oh, A.},
  volume    = {35},
  pages     = {1711--1724},
  publisher = {Curran Associates, Inc.},
  year      = {2022},
  url       = {https://proceedings.neurips.cc/paper_files/paper/2022/file/0b5669c3b07bb8429af19a7919376ff5-Paper-Conference.pdf},
}