---
# general
# NOTE(review): presumably the RNG seed used for reproducibility — confirm
# against the code that loads this file.
seed: 1908

# dataset
# NOTE(review): val_cnt equals train_cnt * val_ratio here
# (20000 * 0.05 = 1000); confirm which of val_cnt / val_ratio the data
# loader actually consumes so the two cannot drift apart.
train_cnt: 20000
val_cnt: 1000
val_ratio: 0.05
# String values are quoted so implicit typing can never re-interpret them.
# Both values equal their key names — presumably placeholders to be replaced
# with real paths; verify before running.
data_path: 'data_path'
prefix_path: 'prefix_path'
batch_size: 16

# train
# Learning rates are written with an explicit decimal point. YAML 1.1
# resolvers (e.g. PyYAML) only recognise a float when the mantissa contains
# a "."; the bare forms 5e-5 / 1e-3 are loaded as strings by such parsers.
# The numeric values are unchanged.
lr: 5.0e-5
dec_lr: 1.0e-3
epoch: 5
# NOTE(review): fractional value — presumably a fraction of an epoch rather
# than an absolute step count; confirm against the training loop.
print_steps: 0.1
alpha1: 0.4
alpha2: 0.4
# orth_alpha and recon_alpha are kept as integers, exactly as before.
orth_alpha: 5
recon_alpha: 5

# model
# String values are quoted so implicit typing can never re-interpret them.
model_name: 'gpt-j'
# Value equals its key name — presumably a placeholder; verify before running.
model_path: 'model_path'
# Short leaf list written in flow style; same two entries as before.
hidden_dims: [4096, 4096]
# from_layer and to_layer are both 8 in this configuration.
from_layer: 8
to_layer: 8
# Both templates currently hold the same pattern. "{}" is presumably a
# format slot filled with a layer index — TODO confirm against the consumer.
module_tmp: 'transformer.h.{}'
layer_tmp: 'transformer.h.{}'
relation_layer: 18

# experiment
# Free-text labels, quoted so they always load as strings.
exp_name: 'run'
exp_dsc: 'contrastive v4 - data_v2'
