# Create a dedicated conda environment named VDPO with Python 3.10 and switch to it.
conda create -n VDPO python=3.10
conda activate VDPO
# Install the dependencies listed in requirement.yaml.
# NOTE(review): `pip install -r` expects pip requirements-file syntax; confirm
# requirement.yaml is in that format and is not a conda environment spec.
pip install -r requirement.yaml
# The extras specifier is quoted because unquoted [mujoco] is a shell glob
# pattern: zsh aborts with "no matches found", and bash would rewrite the
# argument if a matching file name existed in the current directory.
pip install 'gymnasium[mujoco]'
# Run VDPO.py on the Ant-v4 environment with --delay=5.
python3 VDPO.py --env=Ant-v4 --delay=5
@inproceedings{wu2024variational,
title={Variational Delayed Policy Optimization},
author={Wu, Qingyuan and Zhan, Simon Sinong and Wang, Yixuan and Wang, Yuhui and Lin, Chung-Wei and Lv, Chen and Zhu, Qi and Huang, Chao},
booktitle={38th Conference on Neural Information Processing Systems},
year={2024}
}