{
    "embed_dim": 1024,
    "audio_cfg": {
        "arch": "ResNet38",
        "cnn_pretrained": true,
        "freeze": false
    },
    "text_cfg": {
        "model_type": "bert-base-uncased",
        "freeze": false
    }
}