# Hyperparameter sweep definition: grid search minimizing Test/best_rmse.
Sweep:
  method: grid
  metric:
    goal: minimize
    name: Test/best_rmse
  name: ICLR_PS_data_sweep2d_Forward_T2_In_1_OUT_1
  # Candidate values per hyperparameter. With method "grid" the lists below
  # span 2 * 3 * 6 * 4 = 144 combinations.
  # NOTE(review): these names mirror train.base_lr, model.parameters.moe_topk
  # and model.PID.parameters.k_p / k_i -- presumably each sweep value overrides
  # the corresponding default; confirm against the sweep launcher.
  parameters:
    base_lr:
      values: [0.001, 0.005]
    moe_topk:
      values: [2, 3, 4]
    k_p:
      values: [0.01, 0.1, 1, 5, 10, 20]
    k_i:
      values: [0.001, 0.01, 0.1, 1]


# Short sweep label.
# NOTE(review): Sweep.name holds a different, longer name; which of the two
# the consumer actually uses is not visible in this file -- confirm.
Sweep_config:
  name: ICLR_PS_data_sweep
# Dataset/task selection; `task` is an identifier string resolved by the
# consumer (its meaning is not defined in this file).
data:
  task: 2d_Forward_PS_T2_In_1_OUT_1
# Checkpoint loading. EN is false here -- presumably that disables loading
# `ckpt`; confirm. The ckpt filename equals train.save_model_name.
load:
  EN: false
  ckpt: PS_multi_scale.pt
# Experiment-logging metadata for this run (project / group / name / tag).
log_run:
  # Path to an env file -- presumably holds the logging API key; confirm.
  dot_key_path: Assets/key.env
  group: ICLR_2025_09_24
  # Run name as a plain scalar. It must not end in a quote character: in a
  # plain scalar a trailing apostrophe is literal and becomes part of the name.
  name: iclr_ns_dataset_finland1
  note: just for test 23/9/2024
  project: LE_PDE_ICLR
  # NOTE(review): "findland1" differs from "finland1" in `name` -- possibly a
  # typo; left unchanged because existing runs may be filtered by this tag.
  tag: findland1
# Model selection and hyperparameters.
# NOTE(review): several keys below are spelled unusually (lamba_max, lamba_min,
# moe_ploicy). Keys are looked up by the consumer, so do not rename them here
# without changing the code that reads them.
model:
  MOE: true
  # PID settings. k_p, k_i and moe_topk also appear under Sweep.parameters.
  PID:
    Enabled: true
    parameters:
      k_i: 0.02
      k_p: 0.01
      lamba_max: 1
      lamba_min: 0.1
      lambda_ini: 0
      moe_ploicy: Stragey_1 # Stragey_2 is topk=4
      target: 0
  name: Baseline.FNO.FNO_Class
  parameters:
    hidden_channels: 6
    in_channels: 1
    ini_prior: [0,0,0,0] # equivalent to having no prior
    moe_gate_input_size:  [1,1,128,128] # transformer does not need this
    moe_topk: 3
    # NOTE(review): YAML has no tuple syntax. A standard loader splits this
    # flow sequence on every comma, yielding eight strings ("(32", "32)", ...)
    # rather than four pairs. Confirm the consumer re-parses this form;
    # otherwise a nested list such as [[32, 32], [128, 128], [64, 64], [16, 16]]
    # is the YAML-native spelling.
    n_modes: [(32,32),(128,128),(64,64),(16,16)]
    out_channels: 1
    scales: 4x4_DC_MOE_PID_Pre_scale
# Training-loop settings: data location, optimisation schedule, optional loss
# terms (each gated by its own EN flag) and checkpoint output names.
train:
  Dataset_path: '/root/NC_Dataset/2d/possion2d/low_high_freq.pt'
  MOE_router_loss:
    EN: true
  # NOTE(review): Sweep.parameters spans 144 grid points; if this value caps
  # the number of sweep runs, the grid will not be fully covered -- confirm.
  Sweep_count: 100
  base_lr: 0.001
  batchsize: 4
  currium_sampling:
    EN: false
    ini_value: 0.1
  device: cuda:0
  epochs: 200
  lr_scheduler: CosineAnnealingLR
  # NOTE(review): milestones is a MultiStepLR-style setting; presumably unused
  # while lr_scheduler is CosineAnnealingLR -- confirm.
  milestones: [0, 10, 20, 30, 40, 50, 60, 80, 100, 120, 150, 180]
  multi_step_loss:
    EN: false
    # List of four numeric entries.
    value: [1, 0.1, 0.1, 0.1]
  patience: 50
  recon_loss:
    EN: false
  # Quoted so the braces in the directory name are never read as YAML syntax.
  save_dir: 'Checkpoints/ICLR_2025/Test/PS/Test_PS_0924_FNO{32_128_64_16}_Scale_4X4_DC_MOE_4_PID_Prior_0000_raw/'
  save_model_name: PS_multi_scale.pt
  save_name: PS_multi_scale_check_load_.pt
  train_type: accelerate
