# Model constructor expression, stored as a single string. The double-quoted
# scalar spans several lines; YAML folds each line break (and the whitespace
# around it) into one space, so the consumer receives a one-line expression.
# Settings visible in the expression: 224x224 input, linear head, both RGB and
# pose heads enabled, output_mode 'pts3d+pose', a 24-layer / 1024-dim encoder
# and a 12-layer / 768-dim decoder.
# NOTE(review): presumably evaluated by the training script to build the
# model, in a scope where `inf` is defined — confirm against the loader.
model: "ModelUnifiedSimple(ARCroco3DStereoConfig(freeze='none', state_size=768, state_pe='2d', pos_embed='RoPE100',
  rgb_head=True, pose_head=True,  img_size=(224, 224), head_type='linear', output_mode='pts3d+pose',
  depth_mode=('exp', -inf, inf), conf_mode=('exp', 1, inf), pose_mode=('exp', -inf, inf),
  enc_embed_dim=1024, enc_depth=24, enc_num_heads=16, dec_embed_dim=768, dec_depth=12,
  dec_num_heads=12))"
# Pretrained weights file (going by the key name and the .pth extension).
# NOTE(review): relative path — confirm which directory it is resolved against.
pretrained: cut3r_224_linear_4.pth
load_only_encoder: false
long_context: false
fixed_length: true
# null: no resume target is set.
resume: null
benchmark: true
# View counts and correspondence counts. The dataset definitions in this file
# pull these in through ${num_views}, ${num_test_views}, ${n_corres_train} and
# ${n_corres_test}, so changing a value here changes every dataset at once.
num_views: 4
num_test_views: 4
n_corres_train: 0
n_corres_test: 0

# Loss expressions, kept as plain strings. `L21` is a name used inside the
# expressions and has to be resolvable by whatever parses them.
# Training: ConfLoss (alpha=0.2) wrapping Regr3DPoseBatchList.
train_criterion: ConfLoss(Regr3DPoseBatchList(L21, norm_mode='?avg_dis'), alpha=0.2)
# Testing: sum of a Regr3DPose term and a Regr3DPose_ScaleInv term, both with
# gt_scale=True and sky_loss_value=0.
test_criterion: Regr3DPose(L21, norm_mode='?avg_dis', gt_scale=True, sky_loss_value=0) + Regr3DPose_ScaleInv(L21, norm_mode='?avg_dis', gt_scale=True, sky_loss_value=0)

# Training dataset definitions (constructor expressions stored as strings).
# Both use resolution 224, aug_crop=16 and the SeqColorJitter transform, and
# take their view / correspondence counts from ${num_views} and
# ${n_corres_train}.
# NOTE(review): ROOT values are absolute, machine-specific paths.
waymo_train: Waymo_Multi(allow_repeat=False, split=None, ROOT="/workspace/data/preprocessed_cloud_wint/", aug_crop=16, resolution=224, transform=SeqColorJitter, num_views=${num_views}, n_corres=${n_corres_train})
scannet_train: ScanNetpp_Multi(split='train', ROOT="/workspace/data1/scannetpp_processed", aug_crop=16, resolution=224, transform=SeqColorJitter, num_views=${num_views}, n_corres=${n_corres_train})

# Evaluation dataset definitions. All use resolution 224, a fixed seed=42 and
# train_mode=False, and take their view / correspondence counts from
# ${num_test_views} and ${n_corres_test}. No aug_crop or transform is passed.
# NOTE(review): waymo_test uses the same ROOT and split=None as waymo_train,
# and scannet_test uses the same ROOT and split='train' as scannet_train.
# Confirm the evaluation samples do not overlap the training samples.
waymo_test: Waymo_Multi(allow_repeat=False, split=None, ROOT="/workspace/data/preprocessed_cloud_wint/", resolution=224, seed=42, num_views=${num_test_views}, n_corres=${n_corres_test}, train_mode=False)
scannet_test: ScanNetpp_Multi(split='train', ROOT="/workspace/data1/scannetpp_processed", resolution=224, seed=42, num_views=${num_test_views}, n_corres=${n_corres_test}, train_mode=False)
seven_test: SevenScenes_Multi(allow_repeat=False, split=None, ROOT="/workspace/data/seven_scenes/", resolution=224, seed=42, num_views=${num_test_views}, n_corres=${n_corres_test}, train_mode=False)
nrgbd_test: Nrgbd_Multi(allow_repeat=False, split=None, ROOT="/workspace/data/nrgbd/", resolution=224, seed=42, num_views=${num_test_views}, n_corres=${n_corres_test}, train_mode=False)
kitti_test: Kitti_Multi(allow_repeat=False, split=None, ROOT="/workspace/data/kitti/depth_selection/val_selection_cropped", resolution=224, seed=42, num_views=${num_test_views}, n_corres=${n_corres_test}, train_mode=False)

# Dataset mixes, written as `<count> @ <dataset>` terms joined with `+`; each
# ${...} expands to the dataset definition of that name in this file.
# Training mixes Waymo and ScanNet++ (10000 each); testing uses 1000 from each
# of the five evaluation datasets.
# NOTE(review): the count is presumably the number of samples drawn from that
# dataset — confirm against the dataset-string parser.
train_dataset: 10000 @ ${waymo_train} + 10000 @ ${scannet_train}
test_dataset: 1000 @ ${waymo_test} + 1000 @ ${scannet_test} + 1000 @ ${nrgbd_test} + 1000 @ ${seven_test} + 1000 @ ${kitti_test}

# Optimisation hyperparameters; these values are meant to match stage2.yaml.
seed: 0
batch_size: 6
accum_iter: 1
gradient_checkpointing: false
epochs: 100
start_epoch: 0
weight_decay: 0.05
# lr is 5e-6 and min_lr is 1e-6.
# NOTE(review): min_lr is presumably the floor of the learning-rate schedule,
# and warmup_epochs its warm-up length — confirm in the training script.
lr: 5.0e-6
min_lr: 1.0e-06
warmup_epochs: 1
# NOTE(review): an integer rather than a boolean; presumably switches mixed
# precision on — confirm how the consumer interprets it.
amp: 1

# Data-loading and process-launch settings. As written they describe a single,
# non-distributed process: world_size 1, rank 0, distributed false.
num_workers: 8
world_size: 1
# NOTE(review): this is the only key in the file spelled with a hyphen. It is
# left as-is because the consumer is not visible here; confirm whether it
# expects `local-rank` or `local_rank` before renaming.
local-rank: -1
dist_url: 'env://'
rank: 0
gpu: 0
distributed: false
dist_backend: 'nccl'

# Evaluation, checkpointing and logging cadence.
# NOTE(review): units (epochs vs. iterations) are not visible in this file —
# confirm in the training loop.
eval_freq: 10
save_freq: 1
keep_freq: 10
print_freq: 100
print_img_freq: 500
num_imgs_vis: 4
# Output locations. logdir and output_dir are built from save_dir and exp_name
# and expand to ./checkpoints/unified_simple_stage1_norgb/logs and
# ./checkpoints/unified_simple_stage1_norgb/ respectively.
save_dir: 'checkpoints'
# NOTE(review): the name ends in `norgb`, yet the model string sets
# rgb_head=True and rgb_only is True in this file — confirm the name is
# intended.
exp_name: 'unified_simple_stage1_norgb'
task: 'cut3r'
logdir: ./${save_dir}/${exp_name}/logs
output_dir: ./${save_dir}/${exp_name}/
# Hydra's own settings: verbose mode is on, and the run directory expands to
# the same ./<save_dir>/<exp_name> location that output_dir points at.
hydra:
  verbose: true
  run:
    dir: ./${save_dir}/${exp_name}

# Run-level switches: code snapshotting is off, the wandb logger is on.
save_code: false
wandb_logger: true

# Input-mode switches: raymap_only is off, rgb_only is on.
# NOTE(review): exact semantics live in the training code — confirm there.
raymap_only: false
rgb_only: true

test_masked: true
