# Encoder settings, one entry per input modality (keyed by modality name).
# In this file each max_tokens value equals the pad_len listed for the same
# modality under modality_config; presumably the two must stay in sync —
# confirm against the consuming code before changing either.
encoder_configs:
  COVAREP:
    type: 'EmbeddedSequenceEncoder'
    input_size: 74
    max_tokens: 1500
  FACET:
    type: 'EmbeddedSequenceEncoder'
    input_size: 35
    max_tokens: 450
  OpenFace:
    type: 'EmbeddedSequenceEncoder'
    input_size: 713
    max_tokens: 450
  glove_vectors:
    type: 'EmbeddedSequenceEncoder'
    input_size: 300
    max_tokens: 50
# Input handling settings, one entry per modality; the keys are the same
# modality names used under encoder_configs.
# Every modality here uses the same data_col_name and pad_token; only
# pad_len differs between entries.
modality_config:
  COVAREP:
    type: 'embedded_sequence'
    pad_len: 1500
    data_col_name: 'data'
    pad_token: -10000
  FACET:
    type: 'embedded_sequence'
    pad_len: 450
    data_col_name: 'data'
    pad_token: -10000
  OpenFace:
    type: 'embedded_sequence'
    pad_len: 450
    data_col_name: 'data'
    pad_token: -10000
  glove_vectors:
    type: 'embedded_sequence'
    pad_len: 50
    data_col_name: 'data'
    pad_token: -10000
# Scalar run settings. Their exact meaning is defined by the consuming
# training code, which is not visible from this file.
num_fusion_tokens: 88
# seed and ds_seed carry the same value in this configuration.
seed: 43
ds_seed: 43
ds_frac: 1.0
predrop: false
batch_size: 8
lr: 0.0001
# Alternative value noted by the author: 12
layers: 5
# Alternative value noted by the author: constant_with_warmup
lr_scheduler_type: 'cosine'
epochs: 32
# Feature toggles and run paths. Booleans are written in the canonical
# lowercase form (true/false) so they resolve to booleans under every YAML
# schema, not only under loaders that also accept True/False.
# The meaning of each toggle is defined by the consuming training code,
# which is not visible from this file.
bimodal_contrastive: false
non_fusion_fcl: false
# Alternative value noted by the author: true
fcl: false
# NOTE(review): presumably indices into the four modalities listed under
# encoder_configs — confirm against the consuming code.
fcl_root: [0, 1, 2, 3]
do_fcl: false
fusion_combos: [4, 3, 2]
loss_masking: true
zorro: true
no_fusion: false
everything_at_once: false
# NOTE(review): output_dir and restart share the same run-name prefix;
# restart presumably points at a saved state of that earlier run to resume
# from — confirm.
output_dir: 'training_output_23_50_26_02_2024_2_i30'
restart: 'training_output_23_50_26_02_2024_2/30'
clip: 2.0
dataset: 'data/cmu.dataset'
mean_pool: true
jepa_all: false
