# run
# Name of the task this config selects.
# NOTE(review): presumably dispatched on by the launcher — confirm the accepted values there.
task = "sweep"
# Seed value for the run.
# NOTE(review): which RNGs it is applied to is not visible from this file.
seed = 2025


# dataset
# Dataset identifier and the options stored alongside it.
dataset = "RNAGymDataset"
dataset_cfg = {
    "seq_type": "dna",
    "path": "data/DMS_RNAGym_substitutions",
    # Uncomment and set an integer to limit the number of samples:
    # "num_samples": 30,
}

# Loader settings.
batch_size = 1
num_workers = 4

# Directory name used for this run's outputs.
output_dir = "output/rnagym/evo-1.5-8k-base/date"

# Nested list: each inner list holds metric names.
metrics = [
    ["ndcg_abs"],
]

# Accepted score modes:
#   "all" - avg of for+rev
#   "for" - forward only
#   "rev" - reverse only
score_modes = ["all"]


# model
# Identifier string of the model to evaluate.
# NOTE(review): presumably resolved through a model registry — confirm the accepted names there.
model = "EVO1_5_8K_BASE"
# NOTE(review): presumably the k-mer size used when tokenizing sequences
# (1 = single-nucleotide) — confirm against the tokenizer.
kmer = 1
# Boolean switch; the name suggests it selects an Evo-1-style scoring path — TODO confirm.
evo1_score = True


# generation
# Generation mode name, followed by a list of generation settings;
# the list currently holds a single entry.
generate_mode = "base_prompt_generation"
generate_cfg = [
    {
        # temperature / top-k / top-p values
        "temperature": 1, "top_k": 1, "top_p": 1,
        # length values
        "extra_length": 32, "new_length": 32,
    },
]


# evaluation
# Interval between evaluations.
# NOTE(review): the unit (steps, samples, ...) is not stated in this file — confirm with the consumer.
eval_interval = 10000


# wandb (keep anonymized during review)
# Logging toggle; currently off.
use_wandb = False
# Placeholder project and entity names, deliberately anonymized (see the section note above).
# NOTE(review): presumably only read when use_wandb is True — confirm before enabling.
wandb_proj_name = "ANON_PROJECT"
entity = "ANONYMOUS"
