# Configuration for the model variant named below.
# NOTE(review): the ${...} value under `args` looks like OmegaConf/Hydra-style
# interpolation - confirm the loader in use resolves it.
name: Ours_Visualize
args:
  # Taken from the backbone config's `encoder_embed_dim` entry.
  embedding_dim: ${backbone.args.encoder_embed_dim}
  # Presumably a multiplier on the matching loss term - TODO confirm.
  matching_loss_weight: 1.0

  # Both paths are empty strings in this config (nothing is pointed at).
  avm_pretrain_path: ''
  memory_path: ''

  # Presumably names of submodules to attach hooks to - verify against
  # the consuming code.
  hook_module_list:
    - to_a
    - to_v

  # Presumably a multiplier on the OCM loss term - TODO confirm.
  ocm_loss_weight: 1.0
  patch_aff: 0.01

  # Candidate/core ratios for the video and audio streams; all four are 0.5.
  cand_video_ratio: 0.5
  core_video_ratio: 0.5
  cand_audio_ratio: 0.5
  core_audio_ratio: 0.5
  num_core_audio_times: 4

  # Frame selection mode and its temperature.
  # NOTE(review): the set of valid `frame_select` values is not visible here.
  frame_select: original
  frame_temperature: 1.0

  # Nested settings for the memory component.
  mem_args:
    memory_size: 2000