# Seed value.  NOTE(review): presumably the global RNG seed — confirm which
# libraries the loader actually seeds with it.
seed: 42
# All paths below are absolute and machine-specific; adjust them for the
# local environment before running.
exp_dir: /cognitive_comp/user/similarity_generation/experiments/
# "txl" model: a JSON config file and a .pt weights file.
# NOTE(review): "txl" presumably stands for Transformer-XL — confirm.
txl_config_path: /cognitive_comp/user/similarity_generation/model_utils/txl_5B_config.json
txl_model_path: /cognitive_comp/user/source/model_base/model_zh/txl_zh_5.0B.pt
# Points at a directory (model_en/), unlike the single-file txl paths above.
opt_model_path: /cognitive_comp/user/source/model_base/model_en/

# Directories holding pretrained models, one per language suffix (zh / en).
# NOTE(review): which component loads them is not visible here — confirm.
pretrained_zh: /cognitive_comp/user/source/model_base/pretrained_zh/
pretrained_en: /cognitive_comp/user/source/model_base/pretrained_en/
# A single .model file under chinese_sentencepiece/.
# NOTE(review): presumably the SentencePiece tokenizer for the zh model — confirm.
sp_model_path: /cognitive_comp/user/source/model_base/chinese_sentencepiece/cog-pretrain.model

# Input data directories, all under sim_data/.
# NOTE(review): the expected file layout inside each directory is not
# visible from this file — confirm against the data-loading code.
test_sentence_path: /cognitive_comp/user/source/sim_data/predict_sentences/
test_data_path: /cognitive_comp/user/source/sim_data/sim_test_data/
lab_data_path: /cognitive_comp/user/source/sim_data/sim_train_data/

# Checkpoint directory; note that it lives underneath the exp_dir path.
ckpt_model_path: /cognitive_comp/user/similarity_generation/experiments/lightning_logs/checkpoints/
# Data and cache directories under exp_data/.
# NOTE(review): presumably written to during the training cycles — confirm.
sim_data_path: /cognitive_comp/user/source/exp_data/sim_cycle_data/
cache_data_path: /cognitive_comp/user/source/exp_data/sim_cycle_cache/

# Sampling parameters.
# NOTE(review): top_k 0 with top_p 0.95 presumably means top-k filtering is
# off and nucleus sampling is used — confirm in the generation code.
top_k: 0
top_p: 0.95
# NOTE(review): meaning of std_scale is not visible from this file — confirm.
std_scale: 1.2
# NOTE(review): 1.0 presumably applies no repetition penalty — confirm.
repetition_penalty: 1.0

# Batch-size settings.  The trailing notes (e.g. "en-24 / zh-128") are the
# original author's per-language values, kept verbatim.
# NOTE(review): "gen"/"dis" presumably mean generator/discriminator and
# "pre_" the pretraining phase — confirm against the training code.
gen_repeat_times: 1  # number of times generation is repeated for each sentence (zh)
dis_batch_size: 32  # en-24 / zh-128  ####
gen_batch_size: 2
gen_big_batch_size: 30
gen_en_batch_size: 24  # pre-4 / 24
pre_gen_bs: 100  # 100-en / zh-512
pre_dis_bs: 96    # en-96 / zh-384

# Feature switches.  Booleans use the canonical lowercase spelling
# (`true` / `false`), which YAML 1.1 and YAML 1.2 loaders both resolve to a
# boolean; the parsed values are the same as before.
val_me: false
val_check: false
dis_balance: true
dis_use_label: true
warm_up_model: true  ####
pretrain_gen: false  ####
pretrain_dis: false  ####
# These two are integers, not booleans, and are deliberately left as
# integers so any `== 0` / `== 1` comparison in the consumer keeps working.
# NOTE(review): presumably 0/1 switches — confirm against the consumer.
chinese: 0  ####
consistency: 0

# Discriminator settings.
# NOTE(review): dis_hidden_size presumably has to match the hidden width of
# the model named below — confirm before changing either value.
dis_hidden_size: 1024
# The same model name is configured for both languages (en / zh).
discriminator_en: albert_xxlarge
discriminator_zh: albert_xxlarge

# Written with an explicit decimal point on purpose: YAML 1.1 loaders such
# as PyYAML only resolve exponent notation to a float when the mantissa
# contains a ".", so a bare `2e-5` is loaded as the string "2e-5".
# `2.0e-5` is a float under both YAML 1.1 and YAML 1.2.
learning_rate: 2.0e-5  ##
cycle_num: 10  ####
# NOTE(review): -1 presumably means "not set / start from scratch" for
# cycle and idx — confirm against the consumer.
cycle: -1  ####
idx: -1
# NOTE(review): start/end presumably bound a slice of the input sentences,
# with 0/0 as the default — confirm.
start: 0
end: 0
sentence_num: 5000

# Step counts for the training schedule (trailing whitespace removed; the
# parsed values are unchanged).
# NOTE(review): presumably per-cycle step budgets for the generator and
# discriminator — confirm against the training loop.
gen_train_steps: 400
dis_train_steps: 600  ####
warmup_steps: 40  ####
# NOTE(review): "es" presumably stands for early stopping — confirm.
es_patience: 1

# Generator selection switches, written as canonical lowercase booleans
# (same parsed values as before).  Only txl2gen is enabled here.
# NOTE(review): presumably the two are mutually exclusive — confirm.
vae2gen: false
txl2gen: true
