# Readout vision - feature inversion on noised features

# model config
model:  
    # model family name
    name: clip-tfm
    # path to the pretrained weights or huggingface model name
    pretrained: "openai/clip-vit-base-patch32"
    # model alias (optional)
    # model_alias:

# experiment name: used for logging and saving results
# results will be saved under output/readout_vision/results/{model_name}/{dataset_name}/{exp_name}/
exp_name: 250608_DIP

# data
data:
  dataset_name: ImageNet
  image_dir: data/images/imagenet-1k-sampled/source
  #image_names:         # lis of image names to use
  #  - "00000"
  image_names_path: data/images/imagenet-1k-sampled/derivatives/image_names_64.yaml  # file with image names to use
  image_ext: ".JPEG"  # image extension with dot, e.g. ".JPEG" or ".jpg"

# noise
noise:
  target_corr_dists:  # target correlation distance for the noise
    - 0.0
    - 0.1
    - 0.2
    - 0.3
    - 0.4
    - 0.5
    - 0.6
    - 0.7
    - 0.8
    - 0.9
    - 0.99
  noise_seeds:   # random seeds for the noise generation
    - 0
  tol: 0.0001  # tolerance for the correlation distance

# batch size
batch_size: 32

# generator
generator:
  name: deepimageprior

# loss function
critic:
  name: mse

# optimizer
optimizer:
  name: adamw
  lr: 0.0001
  scheduler:
    name: LinearLR
    start_factor: 1.0
    end_factor: 0.0

# parameters for the feature inversion pipeline
pipeline:
  num_iterations: 10000
  eval_interval: 1000
  wandb_log_interval: 100

# list of layers to use (human readable names)
# note that reconstruction is performed for each layer separately
layers:
  - layer_0
  - layer_3
  - layer_6
  - layer_9

# human readable layer name to actual layer name
layer_mapping:
  layer_0: vision_model.encoder.layers.0
  layer_1: vision_model.encoder.layers.1
  layer_2: vision_model.encoder.layers.2
  layer_3: vision_model.encoder.layers.3
  layer_4: vision_model.encoder.layers.4
  layer_5: vision_model.encoder.layers.5
  layer_6: vision_model.encoder.layers.6
  layer_7: vision_model.encoder.layers.7
  layer_8: vision_model.encoder.layers.8
  layer_9: vision_model.encoder.layers.9
  layer_10: vision_model.encoder.layers.10
  layer_11: vision_model.encoder.layers.11
  last_projection: visual_projection


# Optional parameters ----------------
# wandb settings (optional)
wandb: True