import random
from config import alphabet

def reward(seq):
    return 1 if 'a' not in seq else 0

def generate_sample(H):
    seq = []
    for _ in range(H):
        seq.append(random.choice(alphabet))
    return seq, reward(seq)

class ExpectedReward:
    def __init__(self, H):
        self.H = H

    def __call__(self, seq):
        h = len(seq)
        if 'a' in seq:
            return 0.0
        base = (2 / 3) ** (self.H - h)
        return base