# Hyper-parameter sweep definition. The method/metric/parameters layout looks
# like a Weights & Biases sweep config -- TODO confirm against the launcher.
Sweep:
  # With the value lists below the grid has 2 * 3 * 6 * 4 = 144 combinations.
  method: grid
  # Objective to optimise: lower Test/best_rmse is better.
  metric:
    goal: minimize
    name: Test/best_rmse
  name: ICLR_PS_data_sweep2d_Forward_T2_In_1_OUT_1
  parameters:
    base_lr:
      values: [0.001, 0.005]
    moe_topk:
      values: [2, 3, 4]
    # k_p / k_i share their names with model.PID.parameters; presumably the
    # sweep overrides those entries -- verify in the sweep runner.
    k_p:
      values: [0.01, 0.1, 1, 5, 10, 20]
    k_i:
      values: [0.001, 0.01, 0.1, 1]
# baselines

# Sweep-level metadata; only a name is set here.
# NOTE(review): this differs from Sweep.name
# (ICLR_PS_data_sweep2d_Forward_T2_In_1_OUT_1) -- confirm which of the two the
# launcher actually uses.
Sweep_config:
  name: ICLR_PS_data_sweep_baseline
# Dataset / task selection.
data:
  # Task identifier string; how it is resolved is decided by the consumer of
  # this file and is not visible here.
  task: 2d_Forward_PS_T2_In_1_OUT_1
# Checkpoint loading options.
load:
  # Presumably the enable switch for loading `ckpt` -- TODO confirm.
  EN: false
  ckpt: FNO_baseline.pt
# Experiment-logging settings. The project/group/tag layout suggests Weights &
# Biases -- TODO confirm against the logging code.
log_run:
  # Path to an env file, presumably holding the logging API key; keep that
  # file out of version control.
  dot_key_path: Assets/key.env
  group: ICLR_2025_09_24
  # Plain scalar with no quotes: an unmatched trailing quote would become part
  # of the run name.
  name: iclr_ns_dataset_finland1
  note: just for test 23/9/2024
  project: LE_PDE_ICLR
  # NOTE(review): "findland1" differs from "finland1" in `name`. Left as is
  # because existing runs may already be filtered by this tag -- confirm.
  tag: findland1
# Model selection and constructor arguments for the baseline run.
# Key spellings (lamba_max, lamba_min, moe_ploicy, Stragey_1) are kept exactly
# as written because the consuming code presumably looks them up by name.
model:
  MOE: false
  PID:
    Enabled: false
    parameters:
      k_i: 0.0
      k_p: 0.0
      lamba_max: 1
      lamba_min: 0.1
      lambda_ini: 0
      moe_ploicy: Stragey_1  # Stragey_2 is topk=4
      target: 0
  # Dotted name of the model class; presumably resolved by dynamic import.
  name: Baseline.FNO.FNO_Class
  parameters:
    hidden_channels: 6
    in_channels: 1
    # Unset values are written as `null`. A bare `None` is not a YAML null; it
    # loads as the string "None", which is truthy and never `is None`.
    ini_prior: null
    moe_gate_input_size: null  # transformer does not need
    moe_topk: null
    # NOTE(review): YAML has no tuple syntax. This flow sequence parses as the
    # two strings "(16" and "16)". Value left untouched because the shape the
    # model expects ([16, 16] vs [[16, 16]]) is not visible here -- confirm.
    n_modes: [(16,16)]
    out_channels: 1
    scales: 1x1_DC_scale
# Training-loop settings for the baseline run.
train:
  Dataset_path: '/root/NC_Dataset/2d/possion2d/low_high_freq.pt'
  MOE_router_loss:
    EN: false
  # NOTE(review): the grid in `Sweep` spans 144 combinations, more than this
  # count -- confirm whether the cap is intentional.
  Sweep_count: 100
  base_lr: 0.001
  batchsize: 4
  currium_sampling:
    EN: false
    ini_value: 0.1
  device: 'cuda:0'
  epochs: 200
  # Scheduler name matches torch.optim.lr_scheduler.CosineAnnealingLR;
  # `milestones` is presumably only read by a step-based scheduler -- verify.
  lr_scheduler: CosineAnnealingLR
  milestones: [0, 10, 20, 30, 40, 50, 60, 80, 100, 120, 150, 180]
  multi_step_loss:
    EN: false
    value: [1, 0.1, 0.1, 0.1]  # list
  patience: 50
  recon_loss:
    EN: false
  save_dir: Checkpoints/ICLR_2025/Test/PS/Test_PS_0924_Baseline_FNO{16}_Scale_1X1_DC_MOE_raw/
  save_model_name: FNO.pt
  save_name: FNO_check_load_.pt
  train_type: accelerate
