# GPU selection.
gpu:
  # Comma-separated string of two entries; presumably the GPU device indices
  # made visible to the run — TODO confirm against the code that reads it.
  use: "0,1"

# Experiment settings.
experiment:
  # Empty string in this file. NOTE(review): presumably has to be filled in
  # (or is defaulted by the consumer) before a run — confirm.
  experiment_directory: ""

# Trainer selection and its hyperparameters.
trainer:
  # Trainer identifier. NOTE(review): "es" presumably stands for evolution
  # strategies, given population_size / sigma / alpha below — confirm.
  name: "es"
  parameters:
    batch_size: 2
    num_iterations: 1000
    population_size: 30
    # NOTE(review): sigma and alpha look like the perturbation scale and the
    # update step size respectively — confirm against the trainer code.
    sigma: 0.001
    alpha: 0.0005
    # NOTE(review): max_new_tokens and do_sample repeat the values set under
    # `generator`; keep them in sync unless they are meant to differ.
    max_new_tokens: 100
    do_sample: false
    # NOTE(review): presumably a save interval counted in iterations — confirm.
    save_every: 200

# Text-generation settings.
# NOTE(review): key names match Hugging Face `generate()` arguments; presumably
# forwarded to it — confirm against the consumer.
generator:
  max_new_tokens: 100
  num_return_sequences: 1
  do_sample: false

# Model to load.
model:
  # NOTE(review): looks like a Hugging Face Hub model id — confirm.
  name: "Qwen/Qwen2.5-7B-Instruct"
  # Empty string in this file; presumably a cache directory override where
  # empty means "use the default" — TODO confirm.
  hf_cache: ""
  device_map: "auto"

# Tokenizer to load; `name` is the same identifier as `model.name`.
tokenizer:
  name: "Qwen/Qwen2.5-7B-Instruct"
  # Empty string in this file; presumably a cache directory override where
  # empty means "use the default" — TODO confirm.
  hf_cache: ""
  use_fast: false

# Dataset selection.
dataset:
  name: "prompt_answer"
  # NOTE(review): despite the key name, the value is a path to a .csv file,
  # not a directory. The key is left unchanged because consumers read it.
  data_directory: "data/dummy_dataset.csv"

# Task selection; `name` is presumably looked up by the consumer — confirm.
task:
  name: "absolute_length_difference"

# Collator selection; `name` is presumably looked up by the consumer — confirm.
collator:
  name: "data_collator"