

# Launch the scripts.train_ipo module with the configs/training_ipo.yml config
# and the run tag "ipo_reward".
# NOTE: `python -m` takes a dotted module name, not a file name, so the module
# is given without a `.py` suffix (with the suffix Python looks for a submodule
# named `py` inside `scripts.train_ipo` and aborts).
# Run from the directory that contains `scripts/` and `configs/`; both the
# module lookup and the config path are relative to the working directory.
python -m scripts.train_ipo configs/training_ipo.yml --tag ipo_reward
