name: "ours-inversion"
tag: "${rmspace:${system.prompt_processor.prompt},_}"
exp_root_dir: "outputs"
seed: 0

data_type: "random-camera-datamodule"
data:
  n_val_views: 50
  n_test_views: 50
  batch_size: [1,1]
  width: [64,512]
  height: [64,512]
  resolution_milestones: [1000]
  camera_distance_range:  [1.95, 2.0] # [1.5, 2.0]
  fovy_range: [60, 70] #[40, 70]
  elevation_range: [-10, 45] #[-10, 45]
  light_sample_strategy: "dreamfusion"
  eval_camera_distance: 2.0
  eval_fovy_deg: 70.

system_type: "ours-inversion-system"
system:
  project_every: 4
  run_test_every: 500
  rescale_additional_losses: -1
  geometry_type: "implicit-volume"
  geometry:
    radius: 2.0
    normal_type: "analytic"
  
    # the density initialization proposed in the DreamFusion paper
    # does not work very well
    # density_bias: "blob_dreamfusion"
    # density_activation: exp
    # density_blob_scale: 5.
    # density_blob_std: 0.2

    # use Magic3D density initialization instead
    density_bias: "blob_magic3d"
    density_activation: softplus
    density_blob_scale: 10.
    density_blob_std: 0.5

    # coarse to fine hash grid encoding
    # to ensure smooth analytic normals
    pos_encoding_config:
      otype: HashGrid
      n_levels: 16
      n_features_per_level: 2
      log2_hashmap_size: 19
      base_resolution: 16
      per_level_scale: 1.447269237440378 # max resolution 4096

  material_type: "diffuse-with-point-light-material"
  material:
    ambient_only_steps: 100000000
    albedo_activation: sigmoid

  background_type: "neural-environment-map-background"
  background:
    color_activation: sigmoid

  renderer_type: "nerf-volume-renderer"
  renderer:
    radius: ${system.geometry.radius}
    num_samples_per_ray: 512
 
  prompt_processor_type: "stable-diffusion-prompt-processor"
  prompt_processor:
    pretrained_model_name_or_path: "stabilityai/stable-diffusion-2-1-base"
    prompt: "A DSLR photo of a white fluffy cat"
    use_perp_neg: true

  guidance_type: "ours-inversion-guidance"
  guidance:
    t_map_power: 1.0
    trainer_max_steps: 10000
    use_legacy_scheduler: true
    inversion_t_threshold: 1000
    sqrt_anneal: true
    pretrained_model_name_or_path: "stabilityai/stable-diffusion-2-1-base"
    guidance_scale: 10.
    inverse_guidance_scale: -10.
    weighting_strategy: sds
    min_step_percent: 0.01
    max_step_percent: 0.98
    ddim_inverse_n_steps: 30
    inversion_eta: 0.3
    back_cfg_scale: 1.0
    linear_inversion_entropy: false
    inversion_entropy_power: 1.0
    use_sds_scaling: false
    prompt_augmentation_cfg_scale: 1.0

  loggers:
    wandb:
      enable: false
      project: "threestudio"
      name: None

  loss:
    lambda_sds: 1.
    lambda_orient: 1000. #[0, 10., 1000., 5000]
    lambda_sparsity: 1.
    lambda_opaque: 0.
    lambda_z_variance: 300.

  optimizer:
    name: Adam
    args:
      lr: 0.01
      betas: [0.9, 0.99]
      eps: 1.e-15
    params:
      geometry:
        lr: 0.01
      background:
        lr: 0.001

trainer:
  max_steps: 10000
  log_every_n_steps: 1
  num_sanity_val_steps: 0
  val_check_interval: 50
  enable_progress_bar: true
  precision: 16-mixed
  accumulate_grad_batches: 1

checkpoint:
  save_last: true # save at each validation time
  save_top_k: -1
  every_n_train_steps: ${trainer.max_steps}
