# Hydra runtime settings (read by Hydra itself at launch).
hydra:
  run:
    # One output directory per launch: outputs/<date>/<job name>/<time>.
    # `${now:...}` is Hydra's timestamp resolver (strftime format string);
    # `${hydra.job.name}` interpolates the job name set below.
    dir: outputs/${now:%Y-%m-%d}/${hydra.job.name}/${now:%H-%M-%S}
  job:
    # Change the process working directory to `run.dir` before the task
    # function runs, so relative paths resolve inside the run directory.
    chdir: true
    name: pretraining

# --- Hardware and optimisation schedule ---
# NOTE(review): the consumer of these keys is not visible from this file;
# the remarks below are assumptions to confirm against the training script.
num_gpus: 4
num_nodes: 1
# Relative path. With hydra.job.chdir enabled the working directory is the
# Hydra run dir, so this presumably ends up under it — TODO confirm.
save_path: output
optimizer: AdamW
# Written with a decimal point and a signed exponent so that YAML 1.1
# loaders also resolve it as a float rather than a string.
lr: 1.0e-06
# TODO confirm whether this is the per-device or the global batch size.
batch_size: 1024
n_epochs: 2000
log_every_n_steps: 1
# With n_epochs = 2000 this gives 20 validation passes, if the value is
# used as "validate every N epochs" — verify.
check_val_every_n_epoch: 100
# --- Model architecture ---
# NOTE(review): key semantics are defined by the model code, which is not
# visible here; comments below are hedged where they go beyond the values.
# Crystal-side encoder selector.
encoder_name: cgcnn
# Hugging Face model id of the text encoder.
hf_textencoder_model_id: allenai/scibert_scivocab_uncased
# Presumably the tokenizer truncation/padding length — TODO confirm.
max_token_length: 64
# Presumably the size of the shared embedding space; 768 also equals
# textmlp_hidden_dim below — confirm whether the two must stay in sync.
embedding_dim: 768
embedding_normalize: l2
# Text-side MLP settings.
textmlp_n_layers: 3
textmlp_hidden_dim: 768
textmlp_dropout_prob: 0.0
# Crystal-side encoder settings (n_conv_cgcnn presumably applies only when
# encoder_name is cgcnn — verify).
n_conv_cgcnn: 5
crystalencoder_n_mlp_layers: 2
crystalencoder_dropout_prob: 0.0
# --- Loss ---
loss_fn: cosface_loss
# NOTE(review): named for a CLIP-style loss while loss_fn selects
# cosface_loss; presumably ignored in this configuration — confirm.
clip_loss_temperature: 1.0
# margin / loss_scale are presumably the CosFace margin and scale
# hyperparameters — verify against the loss implementation.
margin: 0.5
loss_scale: 3
# --- Run control and checkpointing ---
# Presumably the fraction of the train / validation data used per epoch
# (1.0 = all of it) — TODO confirm how the training script maps these keys.
train_percent_check: 1.0
val_percent_check: 1.0
# NOTE(review): if forwarded to PyTorch Lightning's
# ModelCheckpoint(save_top_k=...), -1 keeps every checkpoint — confirm, and
# check disk usage given the number of epochs.
model_checkpoint_save_top_k: -1
# null = no checkpoint path given (presumably start from scratch — verify).
resume_ckpt_path: null
# --- Data locations ---
# All paths below are absolute and machine/container specific; override them
# when running in a different environment.
dataset_cache_dir: /data/cod_20240907_abst_exist
# NOTE(review): the key says "pickle" but the value points at a .csv file —
# confirm which format the loader actually expects.
input_pickle_path: /data/cod_metadata_20240907.csv
dataset_load_in_memory: true
cod_basepath: /cod
# NOTE(review): the two paths below carry a 20240331 date stamp while the
# two dataset paths above carry 20240907 — confirm the snapshots are meant
# to differ.
caption_json_path: /workspace/generated_data/cod_full_20240331_full_meta-llamaLlama-3_1-8B-Instruct.json
pretrain_dataset_cache_dir: /workspace/data/cod_full_20240331_full_meta-llamaLlama-3_1-8B-Instruct_ft
# --- Text encoder training mode and attention variant ---
# Presumably disables gradient updates for the Hugging Face text encoder —
# TODO confirm in the model code.
freeze_text_encoders: true
# Attention variant selector; the set of accepted values is defined by the
# model code, which is not visible here.
attention: baseline
# Presumably only relevant for some values of `attention` — verify.
num_attention_layers: 4