%YAML 1.2
---
# Name of this configuration; ideally contains no spaces.
name: 't74'                  # ideally no spaces
# NOTE(review): -1 is not a device index; presumably a sentinel value
# (e.g. "no specific GPU") - confirm how the consumer interprets it.
gpu: -1                                 # gpu id to process on

# Where the training data lives and how much of it to read.
dataset:
  # Number of newest chunks to parse.
  num_chunks: 1000000
  # NOTE(review): presumably allows running with fewer chunks than
  # num_chunks when not enough are available - confirm with the loader.
  allow_less_chunks: true
  # Training-set ratio.
  train_ratio: 0.9

  # For separated test and train data (train/test paths support globs).
  input_train: '/data/d/ramdisk_fake/dev2/train/'
  input_test: '/data/d/ramdisk_fake/dev2/test/'
  # NOTE(review): this path is rooted at /data/d/data/ rather than the
  # /data/d/ramdisk_fake/ root used by train and test - confirm it is intended.
  input_validation: '/data/d/data/dev2/validate/'

  # For a one-shot run with all data in one directory.
  # input: '/d/data/'

# Training-loop settings: step counts, learning-rate schedule, loss weights
# and the output location. Indented with 2 spaces like the other sections.
training:
  warmup_steps: 1000
  swa: true
  swa_output: true
  swa_max_n: 10
  swa_steps: 100
  mask_legal_moves: true
  renorm: true
  renorm_max_r: 1.0
  renorm_max_d: 0.0
  q_ratio: 0
  max_grad_norm: 5.4
  batch_size: 1024                # training batch
  num_batch_splits: 1
  value_focus_min: 1.0            # off initially
  value_focus_slope: 0.0
  test_steps: 500                 # eval test set values after this many steps
  validation_steps: 500           # eval validation set values after this many steps
  num_test_positions: 40000
  train_avg_report_steps: 200     # training reports its average values after this many steps
  total_steps: 2000               # terminate after these steps
  # checkpoint_steps: 10000       # optional frequency for checkpointing before finish
  shuffle_size: 500000            # size of the shuffle buffer
  # NOTE(review): both learning rates are identical, so the boundary below
  # presumably has no effect on the rate as configured - confirm intent.
  lr_values:                      # list of learning rates
    - 0.00004
    - 0.00004
  lr_boundaries:                  # list of boundaries
    - 120
  policy_loss_weight: 1.0         # weight of policy loss
  value_loss_weight: 2.0          # weight of value loss
  moves_left_loss_weight: 1.0     # weight of moves left loss
  path: ''                        # network storage dir

# Network architecture parameters.
model:
  # NOTE(review): presumably the number of convolution filters per layer - confirm.
  filters: 128
  # Number of residual blocks, going by the key name.
  residual_blocks: 10
  # NOTE(review): presumably the squeeze-and-excitation ratio - confirm.
  se_ratio: 4
...

