# Control: where results are written and which stage flags are set.
results_dir: experiments/baselines/hamiltonian/large/filtering
storage_id: null
# NOTE(review): presumably these let a rerun skip the generation / evaluation
# stage when its outputs already exist — confirm against the runner.
already_generated: false
already_evaluated: false

# Global settings
# NOTE(review): presumably the random seed for the whole run — confirm which
# components actually consume it.
seed: 0

# Sampling
system_prompt: null
# Fill-in-the-middle style prompt built from the <|fim_prefix|>,
# <|fim_suffix|> and <|fim_middle|> marker tokens.
# `|-` keeps the line breaks and strips the final newline, so the value ends
# exactly at <|fim_middle|>. The body's one-space indent is removed on load;
# the extra indentation of the function-body lines is preserved.
# Do not add comments or trailing spaces inside the block: they would become
# part of the prompt text.
prompt: |-
 <|fim_prefix|>
 def circuit():
     qc = QuantumCircuit(6)
 <|fim_suffix|>
     return qc
 qc = circuit()
 state = Statevector.from_instruction(qc)
 <|fim_middle|>
tokenizer: Qwen/Qwen2.5-Coder-7B
generator: Qwen/Qwen2.5-Coder-7B
# NOTE(review): presumably the hidden-state width of the generator model and
# must be kept in sync with `generator` — confirm.
hidden_dim: 3584
num_samples: 1000
batch_size: 64
temperature: 1.0
max_new_tokens: 512

# Reward feedback
# Identifier of the reward function; NOTE(review): presumably resolved by
# name in the experiment code (not visible here) — confirm valid values there.
reward_function: artificial_quantum_hamiltonian

# Reward model
feature_embedding_model: pauli_observables
embedding_aggregation: nop
# NOTE(review): presumably the length of the feature vector produced by
# `feature_embedding_model` — confirm before changing either key.
embedding_dim: 211
# Alternative value kept for reference: rff(0.5, 10000)
kernel_feature_transformation: bias
inverse_pom_activation_exp: inv_vapor_exp

# Bayesian optimization
acquisition_function: IT
n_marginal_likelihood_warmup_steps: 16
ongoing_marginal_likelihood_maximization: true
whitening: false
exploration_bonus: 4.0
nar: 0.01  # accounts for noisy PRM evaluations
observe_invalid_generations: true

# Weights and Biases run metadata: a list of tags and a free-text note
# (left empty here).
tags:
  - artificial_hamiltonian
notes: ''