# Main Configuration
# GPU selector for the run (presumably a CUDA device ordinal — confirm how the
# consuming script interprets it).
cudaDevice: 1

# Experiment-logging switches (presumably Weights & Biases — confirm in the
# consuming script).
WANDB:
  # Master logging toggle.
  log: false
  # Setting this to false significantly accelerates training.
  logPolicyStats: false
  # NOTE(review): presumably the number of episodes between logged episode
  # visualisations — confirm against the consumer.
  episodeVisFreq: 800

# Model / observation selection. The bracketed lists next to each key enumerate
# the alternative values noted by the original author.
Model:
  # Method selector.
  method: 'BT'  # ['BT', 'EIT']
  obsType: 'Image'
  # Observation representation mode.
  # NOTE(review): presumably has to agree with the model stored under
  # latentRepPath — confirm.
  obsMode: '3d_block'  # ['3d_block', 'dlp', '3d_slot']
  numViews: 3
  # Location of the pre-trained latent-representation model. The path is
  # relative; what it is resolved against is not visible in this file.
  latentRepPath: 'pre_trained_models/bsa'  # [bsa, dlp, osrt]

# Reward configuration.
Reward:
  # Settings for the 'GT' reward variant (presumably "ground truth" — confirm).
  GT:
    reward_scale: 2.0
    # Effective radius of the cube.
    dist_threshold: 0.06
    # Originally annotated "~17 degrees".
    # NOTE(review): if this value is in radians, 0.5 rad is ~28.6 degrees and
    # ~17 degrees would be ~0.3 rad — confirm the unit or refresh the note.
    ori_threshold: 0.5
    clip_reward: true

# Training hyper-parameters.
# Integers are written without `_` digit separators: that form is only an
# integer under YAML 1.1 loaders; YAML 1.2 core-schema loaders would return
# the string "100_000" instead of the number.
Training:
  learningRate: 0.0005
  batchSize: 512
  # NOTE(review): presumably the target-network soft-update coefficient —
  # confirm against the training code.
  tau: 0.05
  # NOTE(review): presumably the reward discount factor — confirm.
  gamma: 0.98
  actionRegCoefficient: 1.0
  # Two-entry lists below: what each position selects is not visible in this
  # file — TODO confirm with the consumer.
  bufferSize: [100000, 100000]  # 100k, 100k
  totalTimesteps: [3000000, 6000000]  # 3M, 6M
  epochEpisodes: 800
  warmupEpisodes: 16
  # NOTE(review): presumably the update-to-data ratio — confirm.
  utdRatio: 0.5
  actionNoiseSigma: 0.2
  explorationEpsilon: 0.3

# Evaluation settings.
Evaluation:
  # Episode count used for evaluation (inferred from the key name — confirm
  # how often evaluation is triggered in the consumer).
  numEvalEpisodes: 16
