# Settings grouped under `image_reward`; judging by the checkpoint path these
# configure an ImageReward (THUDM) model — confirm against the consuming code.
image_reward:
  # Filesystem path to the ImageReward checkpoint file (ImageReward.pt).
  # NOTE(review): this is an absolute, machine-specific path (looks like a
  # WSL mount of drive D:) — it must be adjusted for each environment.
  model_ckpt_path: /mnt/d/hytidel/model/THUDM/ImageReward/ImageReward.pt

  # Two-element list; presumably the [low, high] bounds that the raw reward
  # score is clipped to — TODO confirm against the consuming code.
  clip_range: [-2, 2]

  # Presumably an additive offset and a divisor/scale applied to the reward
  # after clipping — TODO confirm the exact formula and order of operations.
  bias_constant: 2.0
  norm_constant: 1.0
