import numpy as np

# Dyck grammar and experiment configuration.
# Everything below is a plain module-level setting; the only computed values
# are `vocab_size` and `alphabet` at the end.

# --- Grammar ----------------------------------------------------------------
# Number of distinct bracket types.
num_types = 2

# β parameters: probability of each bracket type (should match LM training).
# Example: 20% '(', 80% '['.
type_probs = [0.2, 0.8]

# --- Experiment sweep -------------------------------------------------------
# Values swept by the experiment code that imports this module.
# NOTE(review): the exact meaning of H / alpha / N is defined by the consumer
# and is not visible here -- confirm before changing.
Hs = [10]
alphas = [1, 2]
Ns = [5000, 10000, 15000]
num_reps = 10  # presumably repetitions per configuration -- TODO confirm

# --- Value function training ------------------------------------------------
# Prefix length (A) and completion length (B).
# NOTE(review): A + B = 32 looks like it corresponds to the `len32` part of
# `model_path` below -- confirm when changing either value.
prefix_length = 16  # A
completion_length = 16  # B

# --- Pretrained LM ----------------------------------------------------------
# Path to the pretrained LM checkpoint (update as needed).
model_path = "trained_models/dyck_k2_0.2_0.8_m12_len32/dim512_depth12_heads8/batch32_lr0.0003_wd0.1_warmup100_20250224/0/best.pkl"

# --- Vocabulary -------------------------------------------------------------
# Four special tokens (B, E, P, S) plus two tokens per bracket type
# (presumably one opening and one closing symbol each).
special_tokens = 4
vocab_size = special_tokens + 2 * num_types

# Token ids 0 .. vocab_size - 1, as a list.
alphabet = [*range(vocab_size)]


