# Launch train.py once per layer count, in the order listed (6, then 3).
# For each run the same count is passed to both --vision_vit_layers and
# --depth_vit_layers.
# NOTE(review): presumably a layer-count comparison between the two
# settings — confirm against train.py.
#
# The runs are sequential and independent: a failing run does not stop the
# next one, and the script's exit status is that of the final run.
for layers in 6 3; do
  python3 train.py \
    --vision_vit_layers "$layers" \
    --depth_vit_layers "$layers"
done