# Control: path recorded as the results directory for this configuration.
results_dir: experiments/baselines/protein/small/fibo

# Global setting
seed: 0

# Sampling
# `system_prompt` is one logical line; the folded scalar (`>-`) joins the
# lines below with single spaces and drops the trailing newline.
# NOTE(review): `/no_think` directly follows the last sentence with no
# separating space -- confirm that is intended.
system_prompt: >-
  You are conducting Bayesian optimization (Thompson sampling) fully in
  context. You are provided a list of candidate solutions and the rewards
  achieved by these solutions. Propose a new distinct solution that maximizes
  the reward. Your novel candidate solution must be enclosed by
  <candidate> </candidate>. Never repeat previous solutions. Your search space
  is over amino acid sequences, with each amino acid represented as a
  single-letter code./no_think
# `prompt` keeps its embedded line breaks: the literal scalar (`|-`) preserves
# each newline between lines and strips the final one.
# Presumably the starting amino-acid sequence -- verify against the consumer.
prompt: |-
  MINDLLDISRIISGKMTLDRAEVNLTAIARQVVEEQRQAAEAKSIQLLCSTPDTNHYVFG
  DFDRLKQTLWNLLSNAVKFTPSGGTVELELGYNAEGMEVYVKDSGIGIDPAFLPYVFDRF
  RQSDAADSRNYGGLGLGLAIVKHLLDLHEGNVSAQSEGFGKGATFTVLLPLKPLKRELAA
  VNRHTAVQQSAPLNDNLAGMKILIVEDRPDTNEMVSYILEEAGAIVETAESGAAALTSLK
  SYSPDLVLSDIGMPMMDGYEMIEYIREWKTTKGG
# The tokenizer and generator entries name the same model identifier.
tokenizer: Qwen/Qwen3-0.6B
generator: Qwen/Qwen3-0.6B
num_samples: 1000
temperature: 1.0
max_new_tokens: 2048

# Reward feedback
reward_function: protein_stability

# Weights and Biases
tags:
  - protein
  - FIBO
notes: ""