# Optimizer-related scalars (presumably Adam epsilon/betas — confirm against
# the trainer that consumes this file).
# adam_epsilon is written with an explicit mantissa dot: YAML 1.1 loaders such
# as PyYAML only resolve exponent notation as a float when a "." is present,
# so a bare 1e-08 would be loaded as the string "1e-08".
adam_epsilon: 1.0e-08
add_special_tokens: true
best_metric_type: loss
beta1: 0.9
beta2: 0.98
buffer_size: 10240
# Classifier size per task, keyed by task level and then by task name.
# Each value equals the flat <task>_classifier_size key of the same task
# elsewhere in this file.
classifier_size:
  token_level:
    gene_mask: 2048
    prot_mask: 2048
  span_level:
    gene_type: 128
    prot_homo: 4096
    prot_site: 1024
    prot_domain: 10240
  seq_level:
    gene_taxonomy: 2048
    prot_taxonomy: 2048
    prot_keyword: 2048
  structure_level:
    prot_structure: 128
# General run flags (train/eval/test toggles, dropout, precision).
decay_rate: 0.9
delete_old: false
# Relative path; the base it is resolved against is not visible in this file.
dev_data_dir: ../dataset/lucagplm/v2.0/dev/
do_eval: true
do_lower_case: false
do_metrics: true
do_test: true
do_train: true
dropout_prob: 0.0
embed_scale: 1.0
evaluate_during_training: true
fp16: false
# Plain string "O1"; presumably only relevant when fp16 is true — confirm.
fp16_opt_level: O1
# Label counts for the gene tasks only, keyed by task level and task name.
# The same numbers appear for these tasks under label_size in this file.
gene_label_size_dict:
  token_level:
    gene_mask: 39
  span_level:
    gene_type: 8
  seq_level:
    gene_taxonomy: 735
# Flat per-task settings for gene_mask. The label file is the same path as
# vocab_path and tokenizer_dir in this file.
gene_mask_classifier_size: 2048
gene_mask_label_filepath: ../vocab/lucagplm/v2.0/vocab.txt
gene_mask_loss_type: cce
gene_mask_output_mode: multi_class
gene_mask_weight: 1.0
# Gene task names per task level (one task at each of three levels).
gene_output_keys:
  token_level:
  - gene_mask
  span_level:
  - gene_type
  seq_level:
  - gene_taxonomy
# Output mode for each gene task; all three are multi_class.
gene_output_mode_dict:
  token_level:
    gene_mask: multi_class
  span_level:
    gene_type: multi_class
  seq_level:
    gene_taxonomy: multi_class
# Flat per-task settings for gene_taxonomy (sequence level).
gene_taxonomy_classifier_size: 2048
gene_taxonomy_label_filepath: ../label/lucagplm/v2.0/gene_taxonomy_seq_level_label_v2.txt
gene_taxonomy_loss_type: cce
gene_taxonomy_output_mode: multi_class
gene_taxonomy_weight: 0.2
# Flat per-task settings for gene_type (span level).
gene_type_classifier_size: 128
gene_type_label_filepath: ../label/lucagplm/v2.0/gene_type_span_level_label_v2.txt
gene_type_loss_type: cce
gene_type_output_mode: multi_class
gene_type_weight: 0.2
# NOTE(review): with per_gpu_train_batch_size 1 and n_gpu 8 elsewhere in this
# file, 32 accumulation steps presumably gives an effective batch of 256 —
# confirm against the trainer.
gradient_accumulation_steps: 32
hidden_size: 2560
# Presumably the label value excluded from loss computation — confirm.
ignore_index: -100
# Label count per task, keyed by task level and then by task name.
# The gene_* and prot_* entries match gene_label_size_dict and
# prot_label_size_dict in this file; both mask tasks equal vocab_size (39).
label_size:
  token_level:
    gene_mask: 39
    prot_mask: 39
  span_level:
    gene_type: 8
    prot_homo: 3443
    prot_site: 946
    prot_domain: 13717
  seq_level:
    gene_taxonomy: 735
    prot_taxonomy: 2196
    prot_keyword: 1179
  structure_level:
    prot_structure: 3
learning_rate: 0.0002
local_rank: 0
# Folded block scalar with strip chomping: parses to the single-line path
# below with no trailing newline. The commas are part of the directory name.
log_dir: >-
  ../logs/lucagplm/v2.0/token_level,span_level,seq_level,structure_level/lucaone_gplm/20231125113045
# Two separate step intervals are configured for logging.
logging_steps: 32000
loss_logging_steps: 1000
# Loss identifier per task. Every task uses cce except prot_keyword (bce)
# and prot_structure (l1).
loss_type:
  token_level:
    gene_mask: cce
    prot_mask: cce
  span_level:
    gene_type: cce
    prot_homo: cce
    prot_site: cce
    prot_domain: cce
  seq_level:
    gene_taxonomy: cce
    prot_taxonomy: cce
    prot_keyword: bce
  structure_level:
    prot_structure: l1
# Per-task loss weight. The two mask tasks, prot_keyword and prot_structure
# are 1.0; every other task is 0.2. multi_loss_strategy in this file is
# manual_weight, so these are presumably applied as fixed weights — confirm.
loss_weights:
  token_level:
    gene_mask: 1.0
    prot_mask: 1.0
  span_level:
    gene_type: 0.2
    prot_homo: 0.2
    prot_site: 0.2
    prot_domain: 0.2
  seq_level:
    gene_taxonomy: 0.2
    prot_taxonomy: 0.2
    prot_keyword: 1.0
  structure_level:
    prot_structure: 1.0
lr_update_steps: 760000
max_grad_norm: 1.0
max_length: 1280
max_steps: 16000000
model_config: ../config/lucaone_gplm.json
# Unset: explicit null rather than an empty value.
model_dirpath: null
model_type: lucaone_gplm
multi_loss_strategy: manual_weight
n_gpu: 8
no_cuda: false
# Negatively named switches: true turns the named feature off (going by the
# key names — confirm against the model code).
no_position_embeddings: true
no_token_dropout: true
no_token_type_embeddings: false
no_use_embed_layer_norm: true
no_use_last_layer_norm: false
# Unset: explicit null rather than an empty value.
non_ignore: null
num_attention_heads: 40
num_hidden_layers: 20
num_train_epochs: 5
# Folded block scalar with strip chomping: parses to the single-line path
# below with no trailing newline. The commas are part of the directory name.
output_dir: >-
  ../models/lucagplm/v2.0/token_level,span_level,seq_level,structure_level/lucaone_gplm/20231125113045
# Task names per task level for all tasks (gene and protein combined).
# The contents are identical to pretrain_tasks in this file.
output_keys:
  token_level:
  - gene_mask
  - prot_mask
  span_level:
  - gene_type
  - prot_homo
  - prot_site
  - prot_domain
  seq_level:
  - gene_taxonomy
  - prot_taxonomy
  - prot_keyword
  structure_level:
  - prot_structure
# Output mode per task. Every task is multi_class except prot_keyword
# (multi_label) and prot_structure (regression).
output_mode:
  token_level:
    gene_mask: multi_class
    prot_mask: multi_class
  span_level:
    gene_type: multi_class
    prot_homo: multi_class
    prot_site: multi_class
    prot_domain: multi_class
  seq_level:
    gene_taxonomy: multi_class
    prot_taxonomy: multi_class
    prot_keyword: multi_label
  structure_level:
    prot_structure: regression
padding: right
# No pair-level tasks are configured: all three pair_* mappings are empty.
pair_label_size_dict: {}
pair_output_keys: {}
pair_output_mode_dict: {}
# Batch size per GPU is 1 for both evaluation and training.
per_gpu_eval_batch_size: 1
per_gpu_train_batch_size: 1
# Pooling identifier per task; every task is set to value_attention.
pooling_type:
  token_level:
    gene_mask: value_attention
    prot_mask: value_attention
  span_level:
    gene_type: value_attention
    prot_homo: value_attention
    prot_site: value_attention
    prot_domain: value_attention
  seq_level:
    gene_taxonomy: value_attention
    prot_taxonomy: value_attention
    prot_keyword: value_attention
  structure_level:
    prot_structure: value_attention
# Unset: explicit null rather than an empty value.
pos_weight: null
# One comma-separated string (not a YAML list) naming all ten tasks. The
# folded block scalar with strip chomping parses to that single line with no
# trailing newline.
pretrain_task_level_name: >-
  gene_mask,gene_type,gene_taxonomy,prot_mask,prot_site,prot_homo,prot_domain,prot_taxonomy,prot_keyword,prot_structure
# The four task levels used as keys by the nested mappings in this file.
pretrain_task_level_type:
- token_level
- span_level
- seq_level
- structure_level
# Task names per task level: ten tasks in total across four levels.
pretrain_tasks:
  token_level:
  - gene_mask
  - prot_mask
  span_level:
  - gene_type
  - prot_homo
  - prot_site
  - prot_domain
  seq_level:
  - gene_taxonomy
  - prot_taxonomy
  - prot_keyword
  structure_level:
  - prot_structure
pretrained_model_name: esm2_t36_3B_UR50D
# prot_contact settings. The label file and output mode are unset (null), and
# prot_contact is not listed under pretrain_tasks in this file.
prot_contact_classifier_size: 3072
prot_contact_label_filepath: null
prot_contact_loss_type: mae
prot_contact_output_mode: null
prot_contact_weight: 1.0
# Flat per-task settings for prot_domain (span level).
prot_domain_classifier_size: 10240
prot_domain_label_filepath: ../label/lucagplm/v2.0/prot_domain_span_level_label_v2.txt
prot_domain_loss_type: cce
prot_domain_output_mode: multi_class
prot_domain_weight: 0.2
# Flat per-task settings for prot_homo (span level).
prot_homo_classifier_size: 4096
prot_homo_label_filepath: ../label/lucagplm/v2.0/prot_homo_span_level_label_v2.txt
prot_homo_loss_type: cce
prot_homo_output_mode: multi_class
prot_homo_weight: 0.2
# Flat per-task settings for prot_keyword (sequence level); the only task
# in this file with bce loss and multi_label output.
prot_keyword_classifier_size: 2048
prot_keyword_label_filepath: ../label/lucagplm/v2.0/prot_keyword_seq_level_label_v2.txt
prot_keyword_loss_type: bce
prot_keyword_output_mode: multi_label
prot_keyword_weight: 1.0
# Label counts for the protein tasks only, keyed by task level and task name.
# The same numbers appear for these tasks under label_size in this file.
prot_label_size_dict:
  token_level:
    prot_mask: 39
  span_level:
    prot_homo: 3443
    prot_site: 946
    prot_domain: 13717
  seq_level:
    prot_taxonomy: 2196
    prot_keyword: 1179
  structure_level:
    prot_structure: 3
# Flat per-task settings for prot_mask. The label file is the same path as
# gene_mask_label_filepath and vocab_path in this file.
prot_mask_classifier_size: 2048
prot_mask_label_filepath: ../vocab/lucagplm/v2.0/vocab.txt
prot_mask_loss_type: cce
prot_mask_output_mode: multi_class
prot_mask_weight: 1.0
# Protein task names per task level (seven tasks across four levels).
prot_output_keys:
  token_level:
  - prot_mask
  span_level:
  - prot_homo
  - prot_site
  - prot_domain
  seq_level:
  - prot_taxonomy
  - prot_keyword
  structure_level:
  - prot_structure
# Output mode for each protein task; the values match the prot_* entries of
# output_mode in this file.
prot_output_mode_dict:
  token_level:
    prot_mask: multi_class
  span_level:
    prot_homo: multi_class
    prot_site: multi_class
    prot_domain: multi_class
  seq_level:
    prot_taxonomy: multi_class
    prot_keyword: multi_label
  structure_level:
    prot_structure: regression
# prot_secondary settings. The label file and output mode are unset (null),
# and prot_secondary is not listed under pretrain_tasks in this file.
prot_secondary_classifier_size: 3072
prot_secondary_label_filepath: null
prot_secondary_loss_type: mae
prot_secondary_output_mode: null
prot_secondary_weight: 1.0
# Flat per-task settings for prot_site (span level).
prot_site_classifier_size: 1024
prot_site_label_filepath: ../label/lucagplm/v2.0/prot_site_span_level_label_v2.txt
prot_site_loss_type: cce
prot_site_output_mode: multi_class
prot_site_weight: 0.2
# Flat per-task settings for prot_structure (structure level); the only task
# in this file with l1 loss and regression output.
prot_structure_classifier_size: 128
prot_structure_label_filepath: ../label/lucagplm/v2.0/prot_structure_structure_level_label_v2.txt
prot_structure_loss_type: l1
prot_structure_output_mode: regression
prot_structure_weight: 1.0
# Flat per-task settings for prot_taxonomy (sequence level).
prot_taxonomy_classifier_size: 2048
prot_taxonomy_label_filepath: ../label/lucagplm/v2.0/prot_taxonomy_seq_level_label_v2.txt
prot_taxonomy_loss_type: cce
prot_taxonomy_output_mode: multi_class
prot_taxonomy_weight: 0.2
# Checkpointing, scheduler selection and random seed.
save_all: true
save_steps: 200000
# NOTE(review): presumably a step-wise schedule driven by decay_rate and
# lr_update_steps from this file — confirm against the trainer.
scheduler_type: step
seed: 1111
# Per-task boolean flag. Only prot_keyword is true; it is also the only task
# configured as multi_label with bce loss in this file.
sigmoid:
  token_level:
    gene_mask: false
    prot_mask: false
  span_level:
    gene_type: false
    prot_homo: false
    prot_site: false
    prot_domain: false
  seq_level:
    gene_taxonomy: false
    prot_taxonomy: false
    prot_keyword: true
  structure_level:
    prot_structure: false
# NOTE(review): a non-zero start epoch while model_dirpath is unset in this
# file — confirm how a resumed run locates its checkpoint.
start_epoch: 2
# Folded block scalar with strip chomping: parses to the single-line path
# below with no trailing newline. The commas are part of the directory name.
tb_log_dir: >-
  ../tb-logs/lucagplm/v2.0/token_level,span_level,seq_level,structure_level/lucaone_gplm/20231125113045
test_data_dir: ../dataset/lucagplm/v2.0/test/
tokenization: false
# Despite the _dir suffix, the value is the vocab.txt file path (the same
# path as vocab_path in this file).
tokenizer_dir: ../vocab/lucagplm/v2.0/vocab.txt
train_data_dir: ../dataset/lucagplm/v2.0/train/
# NOTE(review): `trans` does not appear under pretrain_tasks or output_keys
# in this file, and the pair_* mappings are empty — these settings look
# unused for this run; confirm.
trans_classifier_size: 128
trans_label_filepath: ../label/lucagplm/v2.0/trans_pair_level_label_v2.txt
trans_loss_type: bce
trans_output_mode: binary_class
trans_weight: 1.0
truncation: right
vocab_path: ../vocab/lucagplm/v2.0/vocab.txt
# Equals the label_size of gene_mask and prot_mask (39) in this file.
vocab_size: 39
warmup_steps: 64000
weight_decay: 0.01
worker_num: 8
