name: "sd-stage1"
tag: "seed${seed}-${rmspace:${system.prompt_processor.prompt},_}"
exp_root_dir: "outputs"
seed: 0

data_type: "random-camera-datamodule"
data:
  batch_size: [1, 1]
  width: [128, 512]
  height: [128, 512]
  resolution_milestones: [5_000]

  camera_distance_range: [1.3, 1.5]
  fovy_range: [40, 65]
  elevation_range: [0, 40]
  eval_camera_distance: 1.5
  eval_fovy_deg: 65.
  n_val_views: 4

  camera_perturb: 0.
  center_perturb: 0.
  up_perturb: 0.

  low_res_prob: 0.1

system_type: "dreamfusion-object-system"
system:
  geometry_type: "implicit-volume"
  geometry:
    radius: 1.0
    normal_type: analytic

    density_bias: "blob_magic3d"
    density_activation: softplus
    density_blob_scale: 10.
    density_blob_std: 0.5

    pos_encoding_config:
      otype: HashGrid
      n_levels: 16
      n_features_per_level: 2
      log2_hashmap_size: 20
      base_resolution: 16
      per_level_scale: 1.447269237440378 # max resolution 4096

  material_type: "diffuse-with-point-light-material"
  material:
    ambient_only_steps: ${trainer.max_steps} # only acitvate when low res
    textureless_prob: 0.5
    ambient_light_color: [0.8, 0.8, 0.8]
    diffuse_light_color: [0.2, 0.2, 0.2]
    soft_shading: true
    albedo_activation: sigmoid

  background_type: "neural-environment-map-background"
  background:
    color_activation: sigmoid
    random_aug: true

  renderer_type: "nerf-volume-renderer-with-budget"
  renderer:
    return_comp_normal: true
    radius: ${system.geometry.radius}
    num_samples_per_ray: 512
    train_gradient_budget: 13_000_000
    train_chunk_size: 32_768

  noise_generator_type: "triplane-noise-generator"
  noise_generator:
    # 0(random)-1(determined)
    sqrt_beta: 1.0
    noise_h: 64
    noise_w: 64
    noise_background_fix: true

    noise_ptc_resolution: 2048
    peel_depth: 4
    apply_transformation: sph2sqr
    context_type: cuda

    smooth_regularization: true
    weight_decay: [5_000, 0.01, 0.0001, 10_000]

  t_scheduler_type: timestep-scheduler
  t_scheduler:
    min_step_percent: 0.02
    max_step_percent: 0.98
    sqrt_anneal: false
    dreamtime_anneal: null
    trainer_max_steps: ${trainer.max_steps}
    linear_anneal_max: [0, 0.3, 0.6, 0.80]
    linear_anneal_min: ${system.t_scheduler.linear_anneal_max}
    linear_anneal_steps: [0, 2_500, 12_500, 25_000]

  prompt_processor_type: "stable-diffusion-prompt-processor"
  prompt_processor:
    pretrained_model_name_or_path: "stabilityai/stable-diffusion-2-1-base"
    prompt: "A 3D model of an adorable cottage with a thatched roof"
    negative_prompt: "lack details, ugly, oversmoothed, bad structure, out of focus, blurry, cartoon, oversaturated, foggy, hazy, bad anatomy, malformed, pixelated obscure, unnatural colors, dull, unclear, lowres, low quality, deformed, dehydrated"
    front_threshold: 30.
    back_threshold: 30.

  guidance_type: "stable-diffusion-unified-guidance"
  guidance:
    weighting_strategy: dmd
    guidance_type: sds
    guidance_stab_type: null
    pretrained_model_name_or_path: "stabilityai/stable-diffusion-2-1-base"
    guidance_scale: 70.
    use_img_loss: null

  loggers:
    wandb:
      enable: false
      project: ${name}
      name: ${tag}

  loss:
    lambda_sd: 1.
    lambda_sd_img: 1e-2
    lambda_normal_smooth: [5_000, 1000., 100., 25_000]
    lambda_3d_normal_smooth: 0.
    lambda_orient: 0.
    lambda_sparsity: 0.
    lambda_opaque: 0.
    lambda_z_variance: 0.

  optimizer:
    name: Adam
    args:
      betas: [0.9, 0.99]
      eps: 1.e-15
    params:
      geometry.encoding:
        lr: 0.01
      geometry.density_network:
        lr: 0.001
      geometry.feature_network:
        lr: 0.001
      background:
        lr: 0.001

trainer:
  max_steps: 25_000
  log_every_n_steps: 50
  num_sanity_val_steps: 0
  val_check_interval: 500
  enable_progress_bar: true
  precision: 16-mixed

checkpoint:
  save_last: true # save at each validation time
  save_top_k: -1
  every_n_train_steps: ${trainer.max_steps}
