import numpy as np
import math

def pack_more_bits(arr: np.ndarray) -> np.ndarray:
    """
    Assume we have an array of shape (n, m) with values 0 or 1.
    And want to pack the bits along the second axis creating a vector of shape (n,)

    Input array must by of type np.uint8.
    Return array of type np.uint32, where each element is a packed representation of the bits.
    The input array must have at most 32 columns.
    """
    assert arr.ndim == 2, "Input array must be 2D"
    n, m = arr.shape
    assert m <= 32, "Input array must be at most 32 columns"

    p = math.ceil(m / 8)
    padding = (8 - m % 8) % 8
    if padding > 0:
        padding = np.zeros((n, padding), dtype=np.uint8)
        arr = np.concatenate((padding, arr), axis=1)
    arr = arr.reshape(n, -1, p, 8)
    packed = np.packbits(arr).reshape(n, -1)
    packed = np.ascontiguousarray(packed[:, ::-1])

    padding2 = 4 - packed.shape[1]
    padding2 = np.zeros((n, padding2), dtype=np.uint8)
    packed = np.concatenate((packed, padding2), axis=1)
    return packed.view(np.uint32)[:, 0]



def unpack_more_bits(arr: np.ndarray, target_columns: int) -> np.ndarray:
    """
    Unpack the bits from the packed representation.
    Input array must be of type np.uint32.
    Return array of shape (n, target_columns), where each element is a bit.
    n is the number of rows in the input array.
    """
    assert arr.ndim == 1, "Input array must be 1D"
    assert arr.dtype == np.uint32, "Input array must be of type np.uint32"
    
    n = arr.shape[0]
    m = target_columns
    padding1 = (8 - m % 8) % 8
    padding2 = 4 - math.ceil(m / 8)

    arr = arr.reshape(-1, 1).view(np.uint8)[:, ::-1]
    arr = np.ascontiguousarray(arr[:, padding2:])
    unpacked = np.unpackbits(arr).reshape(n, -1)
    unpacked = unpacked[:, padding1:].reshape(n, -1)
    return unpacked