# Code for reproducing Variational Delayed Policy Optimization (VDPO)

## 1. Requirements
    conda create -n VDPO python=3.10
    conda activate VDPO
    pip install -r requirement.yaml
    pip install gymnasium[mujoco]
## 2. Run VDPO
    python3 VDPO.py --env=Ant-v4 --delay=5