name: LeapHandHora
defaults:
  - AllegroHandHora
env:
  test: False
  reset_height_threshold: 0.625
  # grasp_cache_name: 'public_allegro'
  grasp_cache_name: 'leap'

  reward:
    rotateRewardScale: 1.25
    addAuxPoseGuidance: False
    guidingDeltaRotAngle: 90
    rotAngleThreshold: 15
    auxPoseGuidanceCoef: 1.0
    addTildingTermination: False
    tildingDegreeThreshold: 30.0
    addZRotPenalty: False
    addRotp: False
    rotpCoef: 0.1
    rotpWarmupSteps: 10
    rotpIncreasingSteps: 100

  changeGravityDir: False

  asset:
     handAsset: 'assets/leap_hand/leap_hand_right.urdf'

  object:
    nnInsts: 300

  rotAxis: 'z'
  rotAxisMult: -1

  custmRotAxis: False
  custmRotAxisIdx: 6
  

  

  handType: 'leap'

  handFacingDir: 'up'
  omniWristOrnt: False 
  omniWristHorizontalOrntOnly: False
  omniWristHorizontalOrntRotX: False
  omniWristLowerHalfOnly: False

  handGraspFacingDir: 'palm_down'

  disableObjGravity: False

  adjustableRotVel: False

  scheduleRotVelCoef: True
  rotVelCoefMin: 0.0001
  rotVelCoefMax: 1.0
  scheduleRotVelWarmingUpSteps: 200
  scheduleRotVelIncreasingSteps: 1000

  gravityVal: -9.81
  getFingertipObs: False

  evaluateForStatistics: False
  evaluateGoalConditioned: False
  
  trainGoalConditioned: False
  

  simGravityViaForce: False
  scheduleGravityForce: True
  gravityForceMin: 1.0
  gravityForceMax: 9.8
  scheduleGravityForceWarmingUpSteps: 100
  scheduleGravityForceIncreasingSteps: 200

  scheduleMassUperBound: False
  scheduleMassUperBoundMin: 0.05
  scheduleMassUperBoundMax: 0.25
  scheduleMassUperBoundWarmingUpSteps: 100
  scheduleMassUperBoundIncreasingSteps: 200

  addFingertipStateVelObs: False
  addObjectStateObs: False
  objectDownfacingInitZ: 0.375
  
  addForceObs: False
  addContactForceObs: False
  addContactForceWithBinaryContacts: False
  addObjGoalObservations: False



  customizeGraspPose: False

  usePreoptimizedGraspPose: False 
  preoptimizedGraspPoseFn: ''
  graspToGrasp: False

  handTracking: False
  handTrackingTargetUpdSteps: 50
  applyObjVirtualForce: False
  handTrackingNObj: False

  realToSimAutoTune: False
  realToSimAutoTuneWObj: False

  presetPDGains: False
  presetPDGainsFn: ''

  useOriginalLeapPose: False

  changeRotDir: False
  changeTargetRotDir: 'z'
  changeRotDirPeriod: 200
  changeTargetRotDirMult: 1

  maxEvaluateEnvs: 500000

  addDisturbancesToInitState: False

  recoveryTraining: False
  recoverySuccObjPosThres: 0.001

  randomizeRotDir: False
  usePresetRotDir: False

  addTranslation: False
  translationDir: 'z'
  translationDirMult: 1

  trainActionCompensator: False
  realPlayInfosFn: ''
  actionCompensatorNotUsingRealActions: False
  actionCompensatorNotUseHistory: False
  actionCompensatorWObj: False
  trainActionCompensatorWMotionPred: False
  trainActionCompensatorWMotionPredModelFn: ''


  trainActionCompensatorWRealWM: False # train the compensator with real world model #

  fingertipOnlyActionCompensator: False
  
  actionCompensatorInputJointIdx: -1
  actionCompensatorInputFingerIdx: -1
  actionCompensatorOutputJointIdx: -1
  actionCompensatorOutputFingerIdx: -1

  
  finetuneWithActionCompensator: False 
  actionCompensatorCheckpoint: ''
  compensatorWObjRewType: 'angvel'


  openloopReplay: False
  openloopReplayFolder: ''

  randomStart: False

  
  replayFingerIdx: -1
  replayJointIdx: -1

  optimize_via_fingertip_pos: False
  
  deltaActionScale: 0.020833333333333332

  trainActionCompensatorWFingerRew: False # train the compensator with finger pos as the reward #
  actionCompensatorComputeFingerRew: False # compute the finger pos reward and display it during the training #
  useMaskedActionCompensator: False

  actionCompensatorAddInvActionRew: False
  actionCompensatorInvActionCkptFn: ''
  trainActionCompensatorFreeHand: False


  ##### tune bc model #####
  tuneBCModel: False
  bcModelHistoryLength: 10
  tuneBCviaCompensatorModel: False
  ##### tune bc model #####


  ##### use multiple objects during the training #####
  useMultiObjs: False
  multiObjRandomizeScale: ''
  ##### use multiple objects during the training #####

  

  trainActionCompensatorWResidualWM: False
  useBCBasePolicy: False
  hierarchicalCompensator: False

  actionCompensatorWFullHand: False

  wmPerJoitCompensatorFullHand: False

  output_name: ''

  trainActionCompensatorWRealWMMultiCompensator: False
  numActionCompensator: 1

  specifiedWristOrnt: ''


  enableVhacd: False

  addObjFeatures: False
  objFeatureDim: 64

  lagHistoryBufLength: 3

  evaluateActionAddNoise: False
  evaluateActionNoiseStd: 0.041666666666666664


  trainActionCompensatorUAN: False
  perJointActionCompensator: False

  randomization:
    # # Randomization Property
    # randomizeMass: True
    # randomizeMassLower: 0.01
    # randomizeMassUpper: 0.25
    # randomizeCOM: True
    # randomizeCOMLower: -0.01
    # randomizeCOMUpper: 0.01
    # randomizeFriction: True 
    # randomizeFrictionLower: 0.3 
    # randomizeFrictionUpper: 3.0 
    # randomizeScale: True
    # # if scale_list_init is True, randomizeScaleLower and randomizeScaleUpper is not useful
    # scaleListInit: True
    # randomizeScaleList: [0.8]
    randomizeScaleList: [0.7, 0.72, 0.74, 0.76, 0.78, 0.8, 0.82, 0.84, 0.86]
# task.env.randomization.randomizeScaleList='[0.8]'