# Lookup from a pretrained text-model name to the path string used for it.
# NOTE(review): the paths look relative ('models/<name>'); what they are
# resolved against is not visible here -- confirm with the loader.
pretrained_models_path = dict([
    ('bert-base-uncased', 'models/bert-base-uncased'),
    ('bert-large-uncased', 'models/bert-large-uncased'),
])

# Lookup from a video feature file name to the feature-type name used as a
# key under feat_dims['video'].
video_feats_map = dict([
    ('video_feats.pkl', 'resnet-50'),  # mintrec
    ('swin_roi.pkl', 'swin-roi'),      # mintrec2
])

# Lookup from an audio feature file name to the feature-type name used as a
# key under feat_dims['audio'].
audio_feats_map = dict([
    ('audio_feats.pkl', 'wav2vec2'),  # mintrec
    ('wavlm_feats.pkl', 'wavlm'),     # mintrec2
])

# Two-level lookup: modality ('text' / 'video' / 'audio') -> feature or model
# name -> integer dimension.
# NOTE(review): presumably the size of one feature vector for that source --
# confirm against the code that consumes these values.
feat_dims = dict(
    text={'bert-base-uncased': 768, 'bert-large-uncased': 1024},
    video={'resnet-50': 256, 'swin-roi': 256},
    audio={'wavlm': 768, 'wav2vec2': 768},
)