# Hydra defaults list: compose the shared base config first, then this file.
# `_self_` is listed last, so the keys set below take precedence over the
# values coming from `step_sd3_base_config`.
defaults:
  - step_sd3_base_config
  - _self_

# Dataset overrides layered on top of the base config.
dataset:
  batch_size: 1
  dataset_name: 'yuvalkirstain/pickapic_v1'
  from_disk: false

  # Timestep-related options.
  # NOTE(review): how `constant_timestep` interacts with
  # `variable_timestep: true` is not visible from this file — confirm.
  constant_timestep: 1
  variable_timestep: true

  # Key spelling ("pesudo") is kept exactly as-is.
  # NOTE(review): presumably it has to match the field name in the consuming
  # code — confirm before renaming.
  keep_only_with_pesudo_preference: false
  filter_strategy: 2
  compare_between_timestep: false
  timestep_interval: 1
  largest_timestep: 951

# Optimizer overrides layered on top of the base config.
optimizer:
  # Learning rate, written with an explicit decimal point in the mantissa:
  # YAML 1.1 resolvers such as stock PyYAML read a bare `1e-5` as the string
  # "1e-5" rather than a float, while `1.0e-5` is a float everywhere.
  lr: 1.0e-5

# Loss (criterion) overrides layered on top of the base config.
# NOTE(review): the set of valid `loss_type` values and the terms the two
# coefficients weight are defined in the consuming code — confirm there.
criterion:
  loss_type: score
  batch_coeff: 1.0
  aux_loss_coeff: 1.0

# Learning-rate scheduler overrides layered on top of the base config.
lr_scheduler:
  # Number of warmup steps passed to the scheduler.
  lr_warmup_steps: 1000

# Model overrides layered on top of the base config.
model:
  # Both checkpoint locations are null in this file.
  # NOTE(review): presumably supplied per run (e.g. via a command-line
  # override) — confirm; as written they resolve to null.
  pretrained_model_name_or_path: null
  pretrained_vae_name_or_path: null

  # Initial values for the two logit-scale settings.
  logit_scale_init_value: 2.6592
  score_logit_scale_init_value: 1.0

  freeze_text_encoder: true
  multi_scale: true
  multi_scale_cfg: false
  guidance_scale: 1.0

  # `noise_offset` is disabled here.
  # NOTE(review): `noise_offset_coeff` presumably only matters when it is
  # enabled — confirm.
  noise_offset: false
  noise_offset_coeff: 0.05

# Accelerator / training-loop overrides layered on top of the base config.
accelerator:
  # NOTE(review): upper-case `BF16` presumably matches an enum member name in
  # the consuming code — confirm before changing its case.
  mixed_precision: BF16
  project_name: reward_model
  resume_from_checkpoint: false
  eval_on_start: false
  # The best checkpoint is saved according to this metric.
  metric_name: "accuracy"
  gradient_accumulation_steps: 1
  max_steps: 200000
  num_epochs: 10
  # Null in this file; interpolated into the top-level `output_dir`.
  run_name: null
  save_steps: 5000
  validate_steps: 5000


# Output location, built by interpolation as <project_name>/<run_name>.
# NOTE(review): `accelerator.run_name` has no value in this file, so the path
# is only meaningful once a run name is supplied — confirm it is always set.
output_dir: ${accelerator.project_name}/${accelerator.run_name}
# Hydra runtime settings.
hydra:
  run:
    # Explicit null: no run directory is configured in this file.
    # NOTE(review): presumably overridden at launch or meant to be filled
    # in — confirm.
    dir: null

# Debugging switches; disabled here.
# NOTE(review): `port` is presumably the port a remote debugger uses when
# `activate` is true — confirm.
debug:
  activate: false
  port: 5900