# Control
# Path for this run's results. Presumably an output directory relative to the
# working directory — confirm against the code that reads this config.
results_dir: experiments/baselines/protein/long/small/fibo

# Global setting
# Integer seed for the run. Which random number generators it seeds is decided
# by the consuming code, which is not visible from this file.
seed: 0

# Sampling
# Instruction text for the generator. Written as a folded block scalar: each
# line break below becomes a single space and no trailing newline is added, so
# the loaded value is one line. The trailing "/no_think" is part of the text
# and must stay attached to the final sentence (presumably the Qwen3 switch
# that disables thinking mode — confirm).
system_prompt: >-
  You are conducting Bayesian optimization (Thompson sampling) fully in
  context. You are provided a list of candidate solutions and the rewards
  achieved by these solutions. Propose a new distinct solution that maximizes
  the reward. Your novel candidate solution must be enclosed by <candidate>
  </candidate>. Never repeat previous solutions. Your search space is over
  amino acid sequences, with each amino acid represented as a single-letter
  code./no_think
# Prompt text made of single-letter codes. Written as a literal block scalar:
# the line breaks below are part of the value and there is no trailing newline.
# NOTE(review): confirm the consumer expects the embedded newlines.
prompt: |-
  MINDLLDISRIISGKMTLDRAEVNLTAIARQVVEEQRQAAEAKSIQLLCSTPDTNHYVFG
  DFDRLKQTLWNLLSNAVKFTPSGGTVELELGYNAEGMEVYVKDSGIGIDPAFLPYVFDRF
  RQSDAADSRNYGGLGLGLAIVKHLLDLHEGNVSAQSEGFGKGATFTVLLPLKPLKRELAA
  VNRHTAVQQSAPLNDNLAGMKILIVEDRPDTNEMVSYILEEAGAIVETAESGAAALTSLK
  SYSPDLVLSDIGMPMMDGYEMIEYIREWKTTKGG
# The same model identifier is used for both the tokenizer and the generator.
tokenizer: Qwen/Qwen3-0.6B
generator: Qwen/Qwen3-0.6B
num_samples: 10000
temperature: 1.0
max_new_tokens: 2048
# NOTE(review): "top_o" does not match a common sampling option name; it may be
# a typo for top_k or top_p. Confirm against the code that reads this config
# before renaming, since an unrecognised key may be silently ignored.
top_o: 10
bo_batch_size: 16  # also batch size of batched generation

# Reward feedback
# Identifier of the reward function. How this name is resolved to an
# implementation is not visible from this file.
reward_function: protein_stability

# Weights and Biases
# Tags for the run (a list of two strings).
tags:
  - protein
  - FIBO
# Run notes; deliberately an explicit empty string rather than null.
notes: ""