import numpy as np

def sigmoid(x):
    return 1.0 / (1.0 + np.exp(-x))

def softmax(logits, axis=-1):
    z = logits - np.max(logits, axis=axis, keepdims=True)
    e = np.exp(z)
    return e / np.sum(e, axis=axis, keepdims=True)


def phi(s, a, S, A):
    v = np.zeros(S * A)
    v[s * A + a] = 1.0
    return v

def phi_idx(s, a, S, A):
    return s * A + a

