# Training-run settings. The exact meaning of each key is defined by the
# consuming training code, which is not visible from this file; notes marked
# "presumably" / "confirm" are reviewer assumptions, not verified facts.
train:
    # Presumably the random seed used for reproducibility -- confirm in trainer.
    seed: 1234
    epochs: 80
    batch_size: 8
    # Presumably the checkpoint interval, in epochs -- confirm in trainer.
    save_every_n_epoch: 2
    # Plain scalar that is not a valid number, so YAML loads it as the
    # string "16-mixed" (not an integer).
    precision: 16-mixed
    # Presumably the gradient-clipping threshold; whether it is applied by
    # norm or by value is not visible here -- confirm.
    gradient_clip: 1.0
    # The next two keys are boolean flags (names suggest they control which
    # checkpoints/weights are written -- confirm against the consumer).
    if_save_every_weights: true
    if_save_latest: false
    # Relative directory path (trailing slash included in the value).
    half_weights_save_dir: "GPT_weights/"
    # "xxx" also appears as the directory component of every path at the
    # bottom of this file; presumably a placeholder for the experiment name.
    exp_name: "xxx"
# Optimizer / learning-rate settings. All three rates contain a decimal
# point and therefore load as floats. Note the ordering of the values:
# lr_init (1e-5) < lr_end (1e-4) < lr (1e-2).
# NOTE(review): the names suggest a warmup from lr_init up to lr over
# warmup_steps, followed by a decay towards lr_end by decay_steps -- the
# scheduler is not visible here, so confirm against the consuming code.
optimizer:
    lr: 0.01
    lr_init: 0.00001
    lr_end: 0.0001
    warmup_steps: 2000
    decay_steps: 40000
# Data-loading settings (semantics defined by the consuming code, which is
# not visible from this file).
data:
    max_eval_sample: 8
    # Presumably a maximum sample duration in seconds -- confirm.
    max_sec: 54
    # Presumably the number of data-loader worker processes -- confirm.
    num_workers: 2
    pad_val: 1024 # same value as model.EOS (1024) below; keep the two in sync
# Model hyperparameters (semantics defined by the consuming model code,
# which is not visible from this file).
model:
    # Equals EOS + 1 (1024 + 1); presumably EOS is the last index of the
    # vocabulary -- confirm.
    vocab_size: 1025
    phoneme_vocab_size: 512
    # embedding_dim and hidden_dim are set to the same value here.
    embedding_dim: 512
    hidden_dim: 512
    # Presumably the number of attention heads; 512 / 16 = 32 -- confirm.
    head: 16
    linear_units: 2048
    n_layer: 24
    # Written without a decimal point, so this loads as the integer 0,
    # not the float 0.0.
    dropout: 0
    # Same value as data.pad_val (1024) above; keep the two in sync.
    EOS: 1024
    # Integer 0; presumably used as an off/on flag -- confirm.
    random_bert: 0
# Inference-time settings.
inference:
    # Presumably the k used for top-k sampling during decoding -- confirm.
    top_k: 5

# Top-level input/output paths (not nested under any section above).
# All are relative paths under "logs/xxx/"; "xxx" matches train.exp_name,
# so it is presumably a placeholder for the experiment name -- confirm.
# The dev_* files mirror the train_* files with a "-dev" suffix.
train_semantic_path: "logs/xxx/6-name2semantic.tsv"
train_phoneme_path: "logs/xxx/2-name2text.txt"
dev_semantic_path: "logs/xxx/6-name2semantic-dev.tsv"
dev_phoneme_path: "logs/xxx/2-name2text-dev.txt"
output_dir: "logs/xxx/logs_s1"