# Global run settings. Values written as ${name} are interpolation references
# to other keys in this file (OmegaConf/Hydra-style syntax; presumably resolved
# by the config loader — confirm).
# `device` is referenced by init, data, guidance, renderer,
# renderer.background and auxiliary.
device: cuda
# Referenced by data.batch_size.
batch_size: 8
grad_accum: 1
# Referenced by mask_end_step, lr.mean, lr.svec, data.max_steps,
# guidance.max_steps and renderer.prune.end.
max_steps: 15000
huggingface_offline: false
use_bg: true
rgb_only: false
mask_start_step: 1
# Tied to max_steps through interpolation.
mask_end_step: ${max_steps}
# NOTE(review): "enbled" looks like a typo for "enabled". The same spelling is
# referenced by renderer.multiple_groups_enbled, so a rename has to touch both
# places and whatever code reads this key.
multiple_groups_enbled: true
# Referenced by init.num_groups and renderer.num_groups.
# NOTE(review): -1 is presumably a sentinel (e.g. "derive automatically") —
# confirm against the consuming code.
num_groups: -1
# Reused as the period of every *_period entry under `eval`.
log_period: 293
# Referenced by guidance.use_object_dependent_view and by each entry of
# init.subinit[0].part_specific_guidance_prompts.
use_object_dependent_view: true
# `llm_init` section: disabled in this config, and no JSON path is set.
# NOTE(review): json_path is presumably required once `enabled` is true —
# confirm.
llm_init:
  enabled: false
  json_path: null
# Optimizer selection. `opt_args` is presumably forwarded to the optimizer
# constructor — confirm against the training code.
optimizer:
  type: Adam
  opt_args:
    # NOTE(review): much smaller than the 1e-8 default of torch.optim.Adam, if
    # that is what `type: Adam` maps to — confirm this is intentional.
    eps: 1.0e-15
# Learning rates, one entry per parameter group.
# Scalar entries are presumably constant rates; the four-element lists are
# presumably schedules of the form [start, end, num_steps, decay_type] —
# confirm the field order against the scheduler code.
lr:
  # '${max_steps}' is quoted only because `{` and `}` are flow indicators
  # inside [...]; it still loads as the plain string ${max_steps}.
  mean: [0.005, 3.0e-05, '${max_steps}', exp]
  svec: [0.003, 0.001, '${max_steps}', exp]
  qvec: 0.003
  color: 0.01
  alpha: 0.003
  bg: 0.003
  # All three object2world_* entries are 0.0 in this config.
  object2world_Tvec_for_groups: 0.0
  object2world_scale_scalar_for_groups: 0.0
  object2world_qvec_for_groups: 0.0
# Initialisation settings. `type: multiple_groups` with one entry under
# `subinit`; device and num_groups follow the top-level keys.
init:
  device: ${device}
  type: multiple_groups
  num_groups: ${num_groups}
  restriction_bbox_type: centered_on_object
  init_bbox_ratio: 0.68
  restriction_bbox_ratio: 2.1
  autoencoder_type: CLIPAutoencoder
  subinit:
  - type: shap_e_with_bbox
    # Same value as init.restriction_bbox_ratio above.
    restriction_bbox_ratio: 2.1
    prompt: Great Pyramid
    num_points: 12288
    mean_std: 0.8
    svec_val: 0.02
    alpha_val: 0.8
    random_color: true
    facex: true
    xyz_offset: [0, 0, 0]
    # Two parts, each given as a pair of 3-vectors. Presumably
    # [min_corner, max_corner] as fractions of the object's extent: the first
    # spans 0.0-0.5 on the first axis, the second 0.5-1.0 — confirm.
    part_space_ratios:
    - [[0.0, 0.0, 0.0], [0.5, 1.0, 1.0]]
    - [[0.5, 0.0, 0.0], [1.0, 1.0, 1.0]]
    # Two entries, the same count as part_space_ratios; presumably matched to
    # the parts by index — confirm. The entries differ only in `prompt`.
    part_specific_guidance_prompts:
    - type: stable_diffusion
      device: ${guidance.device}
      pretrained_model_name_or_path: ${guidance.pretrained_model_name_or_path}
      prompt: A DSLR photo of pyramid shaped burrito
      negative_prompt: ''
      overhead_threshold: 60.0
      front_threshold: 45.0
      back_threshold: 45.0
      use_cache: true
      use_view_dependent_prompt: true
      view_dependent_prompt_front: false
      use_object_dependent_view: ${use_object_dependent_view}
      use_perp_negative: false
      use_prompt_debiasing: false
      debug: false
    - type: stable_diffusion
      device: ${guidance.device}
      pretrained_model_name_or_path: ${guidance.pretrained_model_name_or_path}
      prompt: A DSLR photo of the Great Pyramid made of snow bricks
      negative_prompt: ''
      overhead_threshold: 60.0
      front_threshold: 45.0
      back_threshold: 45.0
      use_cache: true
      use_view_dependent_prompt: true
      view_dependent_prompt_front: false
      use_object_dependent_view: ${use_object_dependent_view}
      use_perp_negative: false
      use_prompt_debiasing: false
      debug: false
# Evaluation / visualisation output settings.
eval:
  # All three periods follow the top-level log_period.
  image_period: ${log_period}
  video_period: ${log_period}
  focus_word_mask_period: ${log_period}
  # NOTE(review): presumably the camera elevation in degrees used for
  # evaluation renders — confirm.
  elevation: 15
  n_frames: 30
  n_circles: 1
  save_format: mp4
  downsample: 1
# Per-term loss weights; terms set to 0.0 presumably contribute nothing —
# confirm.
loss:
  sds: 0.1
  # Four-element list, presumably a step-based schedule — confirm the field
  # order against the consumer. Note that auxiliary.enabled is false in this
  # config.
  aux_guidance: [2000, 0.01, 0, 2001]
  sparsity: 0.0
  # NOTE(review): `opague` looks like a misspelling of "opaque"; left as-is
  # because the consuming code presumably reads this exact key — confirm
  # before renaming.
  opague: 0.0
  z_var: 0.0
  depth_prior: 0.0
  restriction_bbox: 1.0
# Depth and normal estimators; both are disabled in this config and both
# `value` entries are 0.0.
estimators:
  depth:
    enabled: false
    value: 0.0
  normal:
    enabled: false
    value: 0.0
# Run bookkeeping.
# NOTE(review): save_period is presumably counted in training steps
# (max_steps is 15000) — confirm.
save_period: 5000
wandb: false
# Empty string, not null.
notes: ''
# Camera / view sampling settings. device, batch_size and max_steps follow
# the top-level keys.
# NOTE(review): the two-element lists below are presumably [min, max] sampling
# ranges, with angles in degrees — confirm against the data loader.
data:
  device: ${device}
  batch_size: ${batch_size}
  max_steps: ${max_steps}
  center: [0.0, 0.0, 0.0]
  center_aug_std: 0.05
  azimuth: [-180, 180]
  azimuth_warmup: 0
  elevation: [-20, 90]
  elevation_real_uniform: true
  elevation_warmup: 0
  camera_distance: [2.8, 3.5]
  focal: [0.75, 1.35]
  focal_milestones: null
  # Single-element list paired with an empty milestones list.
  reso: [512]
  reso_milestones: []
  near_plane: 0.01
  far_plane: 100.0
  stratified_on_azimuth: true
# Diffusion guidance settings. `device` and `pretrained_model_name_or_path`
# are also referenced by every entry of
# init.subinit[0].part_specific_guidance_prompts.
guidance:
  type: stable_diffusion
  max_steps: ${max_steps}
  device: ${device}
  pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
  keep_complete_pipeline: true
  repeat_until_success: true
  half_precision_weights: true
  use_view_dependent_prompt: true
  use_object_dependent_view: ${use_object_dependent_view}
  enable_attention_slicing: false
  scheduler:
    type: ddim
    args: null
  guidance_scale: 100.0
  weighting_strategy: sds
  min_step_percent: 0.02
  # Four-element list, presumably a step-based schedule (0.98 and 0.5 being
  # the percentages, 2000 and 2001 the step markers) — confirm the field
  # order against the consumer.
  max_step_percent: [2000, 0.98, 0.5, 2001]
  grad_clip: null
# No prompt type is configured here (null); prompts in this config are given
# under init.subinit instead.
prompt:
  type: null
# Renderer settings, including background, densify, prune and penalty
# sub-sections.
renderer:
  semantics:
    enabled: true
  dynamic_camera_distance:
    enabled: false
  restriction_bbox_loss_enabled: true
  restriction_bbox_loss_weight_type: direct_sum
  num_groups: ${num_groups}
  # NOTE(review): spelled "enbled" (sic) to match the top-level key it
  # references; rename both together, along with the consuming code, if this
  # is ever fixed.
  multiple_groups_enbled: ${multiple_groups_enbled}
  device: ${device}
  tile_size: 16
  frustum_culling_radius: 6.0
  tile_culling_type: aabb
  tile_culling_thresh: 0.01
  tile_culling_radius: 6.0
  T_thresh: 0.0001
  skip_frustum_culling: false
  normal_as_rgb: false
  debug: false
  svec_act: exp
  alpha_act: sigmoid
  color_act: sigmoid
  depth_detach: true
  background:
    type: random
    device: ${device}
    # Presumably the [min, max] range that random background values are drawn
    # from — confirm.
    range: [0.0, 1.0]
    random_aug: false
    random_aug_prob: 0.0
  densify:
    enabled: true
    # NOTE(review): `compatness` looks like a misspelling of "compactness";
    # left as-is because the consuming code presumably matches this exact
    # string — confirm before changing.
    type: compatness
    K: 1
    # NOTE(review): warm_up / end / period are presumably training-step
    # counts — confirm.
    warm_up: 2000
    end: 10001
    period: 1300
    mean2d_thresh: 0.5
    split_thresh: 0.02
    n_splits: 2
    split_shrink: 0.8
    use_legacy: true
  prune:
    enabled: true
    # One less than densify.warm_up (2000).
    warm_up: 1999
    end: ${max_steps}
    period: 500
    radii2d_thresh: 0.003
    alpha_thresh: 0.3
    radii3d_thresh: 0.04
  penalty:
    alpha:
      type: center_weighted
      value: 0.0
# Auxiliary (point_e) guidance section; disabled in this config.
# NOTE(review): the remaining keys presumably only take effect when `enabled`
# is true — confirm.
auxiliary:
  enabled: false
  type: point_e
  device: ${device}
  base_name: base40M-textvec
  weighting_strategy: sds
  # Written as an integer here, whereas guidance.guidance_scale is 100.0.
  guidance_scale: 100
  scheduler_type: original
  # Independent of the top-level batch_size (8).
  batch_size: 4
  min_step_percent: 0.02
  # A plain scalar here, unlike guidance.max_step_percent, which is a
  # four-element list.
  max_step_percent: 0.98
  mean_only: true
  normalize: false
  grad_clip: null
# `upsample_tune` section; disabled in this config.
upsample_tune:
  enabled: false
