# Run settings.
# `task` presumably selects which pipeline step is executed — confirm against
# the consuming script.
# Alternative value kept from earlier runs:
#   calculate_tda_features_from_sparce_matrix
task: calculate_sparse_attns

batch_size: 160
num_workers: 32  # previously 64

# Alternative value used for this setting: cuda:0
device: cpu
# layer: 28
# Other values used in earlier runs: val, test
subset: train

# Calculate attention
# Alternative model identifier used in earlier runs:
#   facebook/esm2_t36_3B_UR50D
model_name: facebook/esm2_t33_650M_UR50D
log_file: log.txt
sum: true  # alternative: false
attn: attns  # alternative: attns_with_cls
threshold: 0.9  # alternatives: 0.99, 0.999
# NOTE(review): earlier values for num_layers were 33, 24 and 36, and for
# num_heads 20, 32 and 40. Confirm that 6 layers is intentional for the `t33`
# checkpoint named in model_name.
num_layers: 6
num_heads: 20
method: 3  # alternative: 1
graph_laplacian: false
with_vert: true
