from torch import Tensor


def hamming_loss(prediction: Tensor, target: Tensor) -> Tensor:
    """
    Computes the Hamming distance between `prediction` and `target`.

    Returns the Hamming distance, summed over all positions in an instance and averaged over all instances.
    Size `[]`.

    Implementation following
    https://github.com/uclnlp/torch-imle/blob/b6678cd77a1a7218de6daa0f777ba6cf6cc5d9a6/annotation-cli.py#L48

    See also https://en.wikipedia.org/wiki/Hamming_distance
    """
    # this is essentially a differentiable version of  errors = prediction != target
    errors = prediction * (1.0 - target) + (1.0 - prediction) * target
    return errors.mean(dim=0).sum()
