# Run selection. NOTE(review): how CASE and ACTION are interpreted is defined by
# the consuming code, which is not visible here — confirm before changing them.
CASE: amino_GNN
ACTION: precompute
# ----- Model config -----
# NOTE(review): MODEL_NAME and SEQ_MODEL_NAME carry the same value; presumably
# they are meant to stay in sync — confirm against the consumer.
MODEL_NAME: esm2_t33_650M_UR50D
SEQ_MODEL_NAME: esm2_t33_650M_UR50D
# The three SEQ_MODEL_* paths below point into the same local model directory.
SEQ_MODEL_PATH: /mnt/ProtLig_GPCRclassA/ProtLig_GPCRclassA/huggingface_models/models--facebook--esm2_t33_650M_UR50D/pytorch_model.bin
SEQ_MODEL_CONFIG_PATH: /mnt/ProtLig_GPCRclassA/ProtLig_GPCRclassA/huggingface_models/models--facebook--esm2_t33_650M_UR50D/config.json
SEQ_MODEL_TOKENIZER_PATH: /mnt/ProtLig_GPCRclassA/ProtLig_GPCRclassA/huggingface_models/models--facebook--esm2_t33_650M_UR50D
BATCH_SIZE: 2
# NOTE(review): the first entry equals MAX_LENGTH (512); presumably the shape is
# (sequence length, embedding width) and both must change together — TODO confirm.
HIDDEN_STATES_SHAPE: [512, 1280]
MAX_LENGTH: 512
# ----- File config -----
HUGGINGFACE_CACHE_DIR: /mnt/ProtLig_GPCRclassA/ProtLig_GPCRclassA/.tokenizers/esm2_t33_650M_UR50D
# DATA_FILE sits inside the directory given as SAVE_DIR.
DATA_FILE: /mnt/ProtLig_GPCRclassA/ProtLig_GPCRclassA/amino_GNN/Data/m2or_conc_mixDiscard_20250501-165522/seqs/discard_by_length/seqs_lower296_upperInf.csv
SAVE_DIR: /mnt/ProtLig_GPCRclassA/ProtLig_GPCRclassA/amino_GNN/Data/m2or_conc_mixDiscard_20250501-165522/seqs/discard_by_length
# NOTE(review): MODE looks like a file-open mode ("w" would overwrite) — confirm.
MODE: w
DBNAME: esm2_t33_650M_UR50D.h5
# NOTE(review): presumably column names in DATA_FILE (a .csv) — verify against
# the consumer.
ID_COL: seq_id
SEQ_COL: mutated_sequence