matrix

Compute the nth power of a square matrix.

Parameters:

Name	Type	Description	Default
`mx`	`Tensor`	The input matrix, must be square (2D tensor).	required
`n`	`int`	The exponent to raise the matrix to.	required

Returns:

Type	Description
`Tensor`	The matrix raised to the nth power.

Notes

If n = 0, the identity matrix of the same size as mx is returned.
If n = 1, the input matrix mx is returned.
For n > 1, recursive computation is used.

Raises:

Type	Description
`AssertionError`	If the input matrix is not 2D.

Source code in tinybig/koala/linear_algebra/matrix.py

def matrix_power(mx: torch.Tensor, n: int) -> torch.Tensor:
    """
    Compute the nth power of a square matrix.

    Parameters
    ----------
    mx : torch.Tensor
        The input matrix, must be square (2D tensor).
    n : int
        The non-negative exponent to raise the matrix to.

    Returns
    -------
    torch.Tensor
        The matrix raised to the nth power.

    Notes
    -----
    - If n = 0, the identity matrix of the same size as `mx` is returned.
    - If n = 1, the input matrix `mx` itself is returned (no copy is made).
    - For n > 1, recursive exponentiation by squaring is used.

    Raises
    ------
    AssertionError
        If the input matrix is None or not 2D.
    ValueError
        If n is negative.
    """
    # Raised explicitly (rather than via `assert`) so the check survives `python -O`.
    if mx is None or mx.ndim != 2:
        raise AssertionError("mx must be a 2D tensor.")

    # A negative exponent would never reach a base case below
    # (-1 -> -2 -> -1 -> ...), so reject it up front.
    if n < 0:
        raise ValueError(f"n must be a non-negative integer, got {n}.")

    if n == 0:
        # Identity matrix matching the row count, dtype and device of mx.
        return torch.eye(mx.shape[0], dtype=mx.dtype, device=mx.device)
    if n == 1:
        return mx
    if n % 2 == 0:
        # Even exponent: square the half power.
        half_power = matrix_power(mx, n // 2)
        return half_power @ half_power
    # Odd exponent: peel off one factor and recurse on the even remainder.
    return mx @ matrix_power(mx, n - 1)

Compute the sum of matrix powers from 1 to n.

Parameters:

Name	Type	Description	Default
`mx`	`Tensor`	The input matrix, must be square (2D tensor).	required
`n`	`int`	The highest power to sum up to.	required

Returns:

Type	Description
`Tensor`	The accumulative matrix power, i.e., mx + mx^2 + ... + mx^n.

Raises:

Type	Description
`AssertionError`	If the input matrix is not 2D.

Source code in tinybig/koala/linear_algebra/matrix.py

def accumulative_matrix_power(mx: torch.Tensor, n: int) -> torch.Tensor:
    """
    Sum the successive powers of a matrix: mx + mx^2 + ... + mx^n.

    Parameters
    ----------
    mx : torch.Tensor
        The input matrix, must be square (2D tensor).
    n : int
        The highest power included in the sum.

    Returns
    -------
    torch.Tensor
        The accumulated sum mx + mx^2 + ... + mx^n. When n <= 1 no further
        powers are added and a copy of `mx` is returned.

    Raises
    ------
    AssertionError
        If the input matrix is not 2D.
    """
    assert mx is not None and mx.ndim == 2

    # Both trackers start at mx^1; clones keep the caller's tensor untouched
    # by the in-place accumulation below.
    current_power = mx.clone()
    running_total = mx.clone()

    # One iteration per additional power (mx^2 .. mx^n).
    for _ in range(n - 1):
        current_power = mx @ current_power
        running_total += current_power

    return running_total

Normalize a matrix based on its row or column sums.

Parameters:

Name	Type	Description	Default
`mx`	`Tensor`	The input matrix, can be dense or sparse.	required
`mode`	`str`	The normalization mode: - "row": Normalize each row by its sum. - "column": Normalize each column by its sum. - "row_column": Normalize rows and then columns, dividing by the square roots of their respective sums.	`'row'`

Returns:

Type	Description
`Tensor`	The degree-normalized matrix.

Raises:

Type	Description
`ValueError`	If an invalid mode is specified.
`AssertionError`	If the input matrix is not 2D.

Source code in tinybig/koala/linear_algebra/matrix.py

def degree_based_normalize_matrix(mx: torch.Tensor, mode: str = "row") -> torch.Tensor:
    """
    Normalize a matrix based on its row or column sums.

    Parameters
    ----------
    mx : torch.Tensor
        The input matrix, can be dense or sparse (COO). Sparse input is
        densified for the computation and converted back to sparse COO on return.
    mode : str
        The normalization mode:
        - "row": Divide each row by its sum.
        - "column": Divide each column by its sum.
        - "row_column": Divide each row by the square root of its sum, then
          divide each column of the result by the square root of its sum.

    Returns
    -------
    torch.Tensor
        The degree-normalized matrix.

    Notes
    -----
    Rows/columns whose sum is exactly zero are divided by 1 instead, so they
    are left unchanged rather than producing a division by zero.

    Raises
    ------
    ValueError
        If an invalid mode is specified.
    AssertionError
        If the input matrix is None or not 2D.
    """
    # Validate before touching any attribute so that None is reported as an
    # AssertionError; raised explicitly so the check survives `python -O`.
    if mx is None or mx.ndim != 2:
        raise AssertionError("mx must be a 2D tensor.")

    was_sparse = mx.is_sparse
    if was_sparse:
        # The arithmetic below is done on a dense copy.
        mx = mx.to_dense()

    if mode == "row":
        # Row normalization: divide each row by its row sum.
        row_sums = mx.sum(dim=1)
        row_sums[row_sums == 0] = 1  # Avoid division by zero
        normalized_mx = mx / row_sums.unsqueeze(1)

    elif mode == "column":
        # Column normalization: divide each column by its column sum.
        col_sums = mx.sum(dim=0)
        col_sums[col_sums == 0] = 1  # Avoid division by zero
        normalized_mx = mx / col_sums.unsqueeze(0)

    elif mode == "row_column":
        # Step 1: divide each row by the square root of its row sum.
        row_sums = mx.sum(dim=1)
        row_sums[row_sums == 0] = 1  # Avoid division by zero
        mx = mx / torch.sqrt(row_sums.unsqueeze(1))

        # Step 2: column sums are taken on the row-scaled matrix from step 1.
        col_sums = mx.sum(dim=0)
        col_sums[col_sums == 0] = 1  # Avoid division by zero
        normalized_mx = mx / torch.sqrt(col_sums.unsqueeze(0))

    else:
        raise ValueError("Invalid normalization option. Choose 'row', 'column', or 'row_column'.")

    if was_sparse:
        normalized_mx = normalized_mx.to_sparse_coo()
    return normalized_mx

Normalize a matrix using a custom operator.

Parameters:

Name	Type	Description	Default
`mx`	`Tensor`	The input matrix, can be dense or sparse.	required
`mask_zeros`	`bool`	Whether to mask zero elements before normalization.	`False`
`rescale_factor`	`float`	A scaling factor to adjust the matrix values.	`1.0`
`operator`	`callable`	A function applied for normalization (e.g., `softmax`).	`softmax`
`mode`	`str`	The normalization mode: - "row": Apply the operator row-wise. - "column": Apply the operator column-wise. - "row-column": Apply the operator first row-wise, then column-wise.	`'row'`

Returns:

Type	Description
`Tensor`	The operator-normalized matrix.

Raises:

Type	Description
`ValueError`	If an invalid mode is specified.
`AssertionError`	If the input matrix is not 2D.

Source code in tinybig/koala/linear_algebra/matrix.py

def operator_based_normalize_matrix(
    mx: torch.Tensor,
    mask_zeros: bool = False,
    rescale_factor: float = 1.0,
    operator: callable = torch.nn.functional.softmax,
    mode: str = "row"
) -> torch.Tensor:
    """
    Normalize a matrix using a custom operator.

    Parameters
    ----------
    mx : torch.Tensor
        The input matrix, can be dense or sparse. Sparse input is densified
        and the result is returned as a dense tensor.
    mask_zeros : bool, optional
        Whether to mask zero elements before normalization. Masked entries
        are replaced by a large negative value before the operator is applied
        and are set back to zero in the result.
    rescale_factor : float, optional
        A scaling factor the matrix is multiplied by before normalization.
    operator : callable
        A function applied for normalization (e.g., `softmax`). It is called
        as ``operator(matrix, dim=...)``.
    mode : str
        The normalization mode:
        - "row": Apply the operator row-wise.
        - "column": Apply the operator column-wise.
        - "row_column" (or "row-column"): Apply the operator first row-wise,
          then column-wise.

    Returns
    -------
    torch.Tensor
        The operator-normalized matrix.

    Raises
    ------
    ValueError
        If an invalid mode is specified.
    AssertionError
        If the input matrix is None or not 2D.
    """
    # Validate before touching any attribute so that None is reported as an
    # AssertionError; raised explicitly so the check survives `python -O`.
    if mx is None or mx.ndim != 2:
        raise AssertionError("mx must be a 2D tensor.")

    if mx.is_sparse:
        mx = mx.to_dense()  # Convert sparse matrix to dense

    mx = mx * rescale_factor

    if mask_zeros:
        # Remember which entries were non-zero so the zeros can be restored
        # after the operator has run.
        mask = (mx != 0).float()
        large_negative_value = -1e9
        masked_mx = mx.clone()
        masked_mx[mx == 0] = large_negative_value
    else:
        masked_mx = mx
        mask = None

    if mode == "row":
        normalized_mx = operator(masked_mx, dim=1)
    elif mode == "column":
        normalized_mx = operator(masked_mx, dim=0)
    elif mode in ("row_column", "row-column"):
        # "row_column" is the documented spelling (and the one used by the
        # sibling normalizers); "row-column" is kept for backward compatibility.
        masked_mx = operator(masked_mx, dim=1)
        normalized_mx = operator(masked_mx, dim=0)
    else:
        raise ValueError("Invalid normalization option. Choose 'row', 'column', or 'row-column'.")

    if mask_zeros:
        normalized_mx = normalized_mx * mask

    return normalized_mx

Normalize a matrix based on its mean and standard deviation.

Parameters:

Name	Type	Description	Default
`mx`	`Tensor`	The input matrix.	required
`mode`	`str`	The normalization mode: - "row": Normalize each row. - "column": Normalize each column. - "row_column", "column_row", or "all": Normalize based on global mean and standard deviation.	`'column'`

Returns:

Type	Description
`Tensor`	The normalized matrix.

Raises:

Type	Description
`ValueError`	If an invalid mode is specified.

Source code in tinybig/koala/linear_algebra/matrix.py

def mean_std_based_normalize_matrix(mx: torch.Tensor, mode="column"):
    """
    Standardize a matrix by subtracting a mean and dividing by a standard deviation.

    Parameters
    ----------
    mx : torch.Tensor
        The input matrix.
    mode : str
        Which statistics are used:
        - "row": per-row mean and standard deviation.
        - "column": per-column mean and standard deviation.
        - "row_column", "column_row" or "all": a single mean and standard
          deviation computed over every element.

    Returns
    -------
    torch.Tensor
        The normalized matrix, ``(mx - mean) / (std + 1e-8)``.

    Raises
    ------
    ValueError
        If an invalid mode is specified.
    """
    # Resolve the reduction axis first; None stands for "reduce over everything".
    if mode == "row":
        axis = 1
    elif mode == "column":
        axis = 0
    elif mode in ["row_column", "column_row", "all"]:
        axis = None
    else:
        raise ValueError("Invalid mode. Choose from 'row', 'column', or 'row_column'.")

    if axis is None:
        center = mx.mean()
        spread = mx.std()
    else:
        # keepdim=True keeps the statistics broadcastable against mx.
        center = mx.mean(dim=axis, keepdim=True)
        spread = mx.std(dim=axis, keepdim=True)

    # The small epsilon guards against a zero standard deviation.
    return (mx - center) / (spread + 1e-8)

Convert a scipy sparse matrix to a PyTorch sparse tensor.

Parameters:

Name	Type	Description	Default
`sparse_mx`	`scipy.sparse matrix`	The input sparse matrix in scipy format.	required

Returns:

Type	Description
`Tensor`	The converted PyTorch sparse tensor.

Source code in tinybig/koala/linear_algebra/matrix.py

def sparse_mx_to_torch_sparse_tensor(sparse_mx):
    """
    Build a PyTorch sparse COO tensor from a scipy sparse matrix.

    Parameters
    ----------
    sparse_mx : scipy.sparse matrix
        The input sparse matrix in scipy format.

    Returns
    -------
    torch.sparse.Tensor
        A sparse COO tensor with float32 values, int64 indices, and the same
        shape as `sparse_mx`.
    """
    # Work in COO layout so the row/column coordinates are directly available.
    coo = sparse_mx.tocoo().astype(np.float32)

    # Stack coordinates as a (2, nnz) int64 array: first row indices, then columns.
    coordinates = np.vstack((coo.row, coo.col)).astype(np.int64)

    return torch.sparse_coo_tensor(
        torch.from_numpy(coordinates),
        torch.from_numpy(coo.data),
        torch.Size(coo.shape),
    )