kernel

Selects and applies a specific kernel function based on the given name.

Parameters:

Name	Type	Description	Default
`kernel_name`	`str`	Name of the kernel function to be used. Options include: 'pearson_correlation', 'kl_divergence', 'rv_coefficient', 'mutual_information', 'custom_hybrid', and their batch counterparts.	`'pearson_correlation'`
`x`	`Tensor`	The first input tensor for the kernel function.	`None`
`x2`	`Tensor`	The second input tensor for pairwise kernel functions.	`None`
`*args`		Additional positional arguments forwarded to the selected kernel function.	`()`
`**kwargs`		Additional keyword arguments forwarded to the selected kernel function.	`{}`

Returns:

Type	Description
`Tensor`	The result of the selected kernel function.

Raises:

Type	Description
`ValueError`	If the specified kernel function is not supported.

Source code in tinybig/koala/statistics/kernel.py

def kernel(
    kernel_name: str = 'pearson_correlation',
    x: torch.Tensor = None, x2: torch.Tensor = None,
    *args, **kwargs
):
    """
    Selects and applies a specific kernel function based on the given name.

    Parameters
    ----------
    kernel_name : str
        Name of the kernel function to be used. Options include:
        'pearson_correlation', 'kl_divergence', 'rv_coefficient',
        'mutual_information', 'custom_hybrid', and their batch counterparts.
    x : torch.Tensor
        The first input tensor for the kernel function.
    x2 : torch.Tensor, optional
        The second input tensor for pairwise kernel functions.
    *args, **kwargs
        Additional arguments for specific kernel functions.

    Returns
    -------
    torch.Tensor
        The result of the selected kernel function.

    Raises
    ------
    ValueError
        If the specified kernel function is not supported.
    """

    if 'batch' in kernel_name:
        assert x is not None and x2 is None
    else:
        assert x is not None and x2 is not None

    match kernel_name:
        case 'pearson_correlation_kernel' | 'pearson_correlation' | 'pearson': return instance_pearson_correlation_kernel(x1=x, x2=x2)
        case 'batch_pearson_correlation_kernel' | 'batch_pearson_correlation' | 'batch_pearson': return batch_pearson_correlation_kernel(x=x, *args, **kwargs)

        case 'kl_divergence_kernel' | 'kl_divergence': return instance_kl_divergence_kernel(x1=x, x2=x2)
        case 'batch_kl_divergence_kernel' | 'batch_kl_divergence': return batch_kl_divergence_kernel(x=x, *args, **kwargs)

        case 'rv_coefficient_kernel' | 'rv_coefficient': return instance_rv_coefficient_kernel(x1=x, x2=x2)
        case 'batch_rv_coefficient_kernel' | 'batch_rv_coefficient': return batch_rv_coefficient_kernel(x=x, *args, **kwargs)

        case 'mutual_information_kernel' | 'mutual_information': return instance_mutual_information_kernel(x1=x, x2=x2)
        case 'batch_mutual_information_kernel' | 'batch_mutual_information': return batch_mutual_information_kernel(x=x, *args, **kwargs)

        case 'custom_hybrid_kernel' | 'custom_hybrid': return instance_custom_hybrid_kernel(x1=x, x2=x2, *args, **kwargs)
        case 'batch_custom_hybrid_kernel' | 'batch_custom_hybrid': return batch_custom_hybrid_kernel(x=x, *args, **kwargs)

        case _: raise ValueError(f'kernel {kernel_name} not supported')

Computes the KL Divergence between distributions.

Parameters:

Name	Type	Description	Default
`x`	`Tensor`	Input tensor representing probabilities.	required
`x2`	`Tensor`	Second tensor representing probabilities for pairwise divergence.	`None`
`dim`	`int`	Dimension along which divergence is calculated. Default is 0.	`0`

Returns:

Type	Description
`Tensor`	KL Divergence value or matrix.

Raises:

Type	Description
`ValueError`	If inputs are invalid or have mismatched dimensions.

Source code in tinybig/koala/statistics/kernel.py

def kl_divergence_kernel(x: torch.Tensor, x2: torch.Tensor = None, dim: int = 0):
    """
    Dispatch to the batch or the pairwise KL divergence kernel.

    Parameters
    ----------
    x : torch.Tensor
        Input tensor representing probabilities.
    x2 : torch.Tensor, optional
        Second tensor for a pairwise divergence. When omitted (None), the
        batch kernel is applied to `x` alone.
    dim : int, optional
        Dimension forwarded to the batch kernel. Default is 0. It is not
        used when `x2` is given.

    Returns
    -------
    torch.Tensor
        Whatever the selected kernel returns: a divergence value for the
        pairwise form or a divergence matrix for the batch form.

    Raises
    ------
    ValueError
        Propagated from the selected kernel when its inputs are invalid.
    """
    # A second tensor selects the pairwise form; `dim` only matters for batches.
    if x2 is not None:
        return instance_kl_divergence_kernel(x1=x, x2=x2)
    return batch_kl_divergence_kernel(x=x, dim=dim)

Computes the KL Divergence for a batch of distributions.

Parameters:

Name	Type	Description	Default
`x`	`Tensor`	Input tensor of shape (n_samples, n_features).	required
`dim`	`int`	Dimension along which divergence is calculated. Default is 0.	`0`

Returns:

Type	Description
`Tensor`	KL Divergence matrix.

Raises:

Type	Description
`ValueError`	If input tensor is invalid or dimensions are incorrect.

Source code in tinybig/koala/statistics/kernel.py

def batch_kl_divergence_kernel(x: torch.Tensor, dim: int = 0):
    """
    Computes the pairwise KL Divergence matrix between the columns of a 2D tensor.

    Each column of `x` (each row when ``dim == 1``) is turned into a
    probability distribution with a softmax, and entry ``[i, j]`` of the
    result is ``KL(p_i || p_j) = sum_k p_i[k] * (log p_i[k] - log p_j[k])``.

    Parameters
    ----------
    x : torch.Tensor
        2D input tensor of unnormalised scores.
    dim : int, optional
        0 to compare columns, 1 to compare rows (the tensor is transposed
        first). Default is 0.

    Returns
    -------
    torch.Tensor
        KL Divergence matrix of shape (m, m), where m is the number of
        compared columns.

    Raises
    ------
    ValueError
        If `x` is None or empty, is not 2D, or `dim` is not 0 or 1.
    """
    if x is None or x.numel() == 0:
        raise ValueError("Input tensors must not be None or empty")
    if x.ndim != 2:
        raise ValueError('x must be of dimension 2...')
    if dim not in [0, 1]:
        raise ValueError('dim must be 0 or 1')

    if dim == 1:
        x = x.T
    _, m = x.shape

    # Work in log space: log(softmax(x)) underflows to -inf for strongly
    # negative scores, and the resulting 0 * -inf terms turn into NaN.
    # log_softmax keeps the log-probabilities finite.
    log_p = torch.nn.functional.log_softmax(x, dim=0)
    p = log_p.exp()

    # Broadcast (b, m, 1) against (b, 1, m) to form every column pair at once.
    kl_div_matrix = (p.unsqueeze(2) * (log_p.unsqueeze(2) - log_p.unsqueeze(1))).sum(dim=0)

    assert kl_div_matrix.shape == (m, m)
    return kl_div_matrix

Computes the Pearson correlation coefficient.

Parameters:

Name	Type	Description	Default
`x`	`Tensor`	Input tensor for correlation computation.	required
`x2`	`Tensor`	Second input tensor for pairwise correlation. If None, computes for a batch.	`None`
`dim`	`int`	Dimension along which to compute the correlation. Default is 0.	`0`

Returns:

Type	Description
`Tensor`	Pearson correlation coefficient or matrix.

Raises:

Type	Description
`ValueError`	If input dimensions are invalid or inputs are empty.

Source code in tinybig/koala/statistics/kernel.py

def pearson_correlation_kernel(x: torch.Tensor, x2: torch.Tensor = None, dim: int = 0):
    """
    Dispatch to the batch or the pairwise Pearson correlation kernel.

    Parameters
    ----------
    x : torch.Tensor
        Input tensor for correlation computation.
    x2 : torch.Tensor, optional
        Second input tensor for a pairwise correlation. When omitted
        (None), the batch kernel is applied to `x` alone.
    dim : int, optional
        Dimension forwarded to the batch kernel. Default is 0. It is not
        used when `x2` is given.

    Returns
    -------
    torch.Tensor
        Whatever the selected kernel returns: a correlation coefficient for
        the pairwise form or a correlation matrix for the batch form.

    Raises
    ------
    ValueError
        Propagated from the selected kernel when its inputs are invalid.
    """
    # A second tensor selects the pairwise form; `dim` only matters for batches.
    if x2 is not None:
        return instance_pearson_correlation_kernel(x1=x, x2=x2)
    return batch_pearson_correlation_kernel(x=x, dim=dim)

Computes the Pearson correlation coefficient matrix for a batch of inputs.

Parameters:

Name	Type	Description	Default
`x`	`Tensor`	Input tensor of shape (n_samples, n_features).	required
`dim`	`int`	Dimension along which to compute correlation. Default is 0.	`0`

Returns:

Type	Description
`Tensor`	Matrix of Pearson correlation coefficients.

Raises:

Type	Description
`ValueError`	If the input tensor is invalid or dimension is incorrect.

Source code in tinybig/koala/statistics/kernel.py

def batch_pearson_correlation_kernel(x: torch.Tensor, dim: int = 0):
    """
    Build the Pearson correlation matrix between the columns of a 2D tensor.

    Parameters
    ----------
    x : torch.Tensor
        2D input tensor. Rows are observations and columns are variables
        when ``dim == 0``; the roles are swapped when ``dim == 1``.
    dim : int, optional
        0 to correlate columns, 1 to correlate rows (the tensor is
        transposed first). Default is 0.

    Returns
    -------
    torch.Tensor
        Square matrix of Pearson correlation coefficients, one row and
        column per variable.

    Raises
    ------
    ValueError
        If `x` is None or empty, is not 2D, or `dim` is not 0 or 1.
    """
    if x is None or not x.numel():
        raise ValueError("Input tensors must not be None or empty")
    if x.ndim != 2:
        raise ValueError('x must be of dimension 2...')
    if dim not in (0, 1):
        raise ValueError('dim must be 0 or 1')

    # Normalise the layout so that variables always run along the columns.
    samples = x.T if dim == 1 else x
    n_obs, n_vars = samples.shape

    # Sample covariance (n - 1 denominator) of the mean-centred data.
    deviations = samples - torch.mean(samples, dim=0, keepdim=True)
    covariance = torch.matmul(deviations.t(), deviations) / (n_obs - 1)

    # Scale every covariance by the product of the two standard deviations.
    sigma = torch.std(deviations, dim=0, correction=1)
    correlation = covariance / torch.outer(sigma, sigma)

    assert correlation.shape == (n_vars, n_vars)
    return correlation

Computes the RV Coefficient for tensors.

Parameters:

Name	Type	Description	Default
`x`	`Tensor`	Input tensor for correlation computation.	required
`x2`	`Tensor`	Second tensor for pairwise coefficient computation.	`None`
`dim`	`int`	Dimension along which the coefficient is computed. Default is 0.	`0`

Returns:

Type	Description
`Tensor`	RV Coefficient value or matrix.

Raises:

Type	Description
`ValueError`	If inputs are invalid or dimensions are mismatched.

Source code in tinybig/koala/statistics/kernel.py

def rv_coefficient_kernel(x: torch.Tensor, x2: torch.Tensor = None, dim: int = 0):
    """
    Dispatch to the batch or the pairwise RV coefficient kernel.

    Parameters
    ----------
    x : torch.Tensor
        Input tensor for the coefficient computation.
    x2 : torch.Tensor, optional
        Second tensor for a pairwise coefficient. When omitted (None), the
        batch kernel is applied to `x` alone.
    dim : int, optional
        Dimension forwarded to the batch kernel. Default is 0. It is not
        used when `x2` is given.

    Returns
    -------
    torch.Tensor
        Whatever the selected kernel returns: a coefficient value for the
        pairwise form or a coefficient matrix for the batch form.

    Raises
    ------
    ValueError
        Propagated from the selected kernel when its inputs are invalid.
    """
    # A second tensor selects the pairwise form; `dim` only matters for batches.
    if x2 is not None:
        return instance_rv_coefficient_kernel(x1=x, x2=x2)
    return batch_rv_coefficient_kernel(x=x, dim=dim)

Computes the RV Coefficient matrix for a batch of inputs.

Parameters:

Name	Type	Description	Default
`x`	`Tensor`	Input tensor of shape (n_samples, n_features).	required
`dim`	`int`	Dimension along which coefficients are computed. Default is 0.	`0`

Returns:

Type	Description
`Tensor`	RV Coefficient matrix.

Raises:

Type	Description
`ValueError`	If input tensor is invalid or dimensions are incorrect.

Source code in tinybig/koala/statistics/kernel.py

def batch_rv_coefficient_kernel(x: torch.Tensor, dim: int = 0):
    """
    Computes the RV Coefficient matrix for a batch of inputs.

    For every pair of distinct columns ``i != j`` the entry is
    ``cov(x_i, x_j) / sqrt(var(x_i) * var(x_j))`` clamped to ``[0, 1]``, so
    negatively related columns map to 0. The diagonal is left at 0.

    Parameters
    ----------
    x : torch.Tensor
        2D input tensor. Rows are observations and columns are variables
        when ``dim == 0``; the roles are swapped when ``dim == 1``.
    dim : int, optional
        0 to compare columns, 1 to compare rows (the tensor is transposed
        first). Default is 0.

    Returns
    -------
    torch.Tensor
        Symmetric (m, m) RV Coefficient matrix with the same dtype and
        device as `x`.

    Raises
    ------
    ValueError
        If `x` is None or empty, is not 2D, or `dim` is not 0 or 1.
    """
    if x is None or x.numel() == 0:
        raise ValueError("Input tensors must not be None or empty")
    if x.ndim != 2:
        raise ValueError('x must be of dimension 2...')
    if dim not in [0, 1]:
        raise ValueError('dim must be 0 or 1')

    if dim == 1:
        x = x.T
    b = x.shape[0]

    # Center the variables
    x_centered = x - torch.mean(x, dim=0, keepdim=True)

    # Sample covariance of every column pair; the diagonal holds the variances.
    cov_matrix = torch.matmul(x_centered.t(), x_centered) / (b - 1)
    variances = torch.diagonal(cov_matrix)

    # All pairwise coefficients at once. Deriving the result from `x` keeps
    # its dtype and device instead of falling back to a default-dtype CPU
    # buffer.
    rv_coeff_matrix = cov_matrix / torch.sqrt(torch.outer(variances, variances))

    # Restrict to [0, 1]; this also maps negative coefficients to 0.
    rv_coeff_matrix = torch.clamp(rv_coeff_matrix, min=0.0, max=1.0)

    # Only off-diagonal pairs are reported; self-pairs stay at zero.
    rv_coeff_matrix.fill_diagonal_(0.0)

    return rv_coeff_matrix

Computes the Mutual Information for tensors.

Parameters:

Name	Type	Description	Default
`x`	`Tensor`	Input tensor for mutual information computation.	required
`x2`	`Tensor`	Second tensor for pairwise computation.	`None`
`dim`	`int`	Dimension along which the information is computed. Default is 0.	`0`

Returns:

Type	Description
`Tensor`	Mutual Information value or matrix.

Raises:

Type	Description
`ValueError`	If inputs are invalid or dimensions are mismatched.

Source code in tinybig/koala/statistics/kernel.py

def mutual_information_kernel(x: torch.Tensor, x2: torch.Tensor = None, dim: int = 0):
    """
    Dispatch to the batch or the pairwise Mutual Information kernel.

    Parameters
    ----------
    x : torch.Tensor
        Input tensor for the mutual information computation.
    x2 : torch.Tensor, optional
        Second tensor for a pairwise computation. When omitted (None), the
        batch kernel is applied to `x` alone.
    dim : int, optional
        Dimension forwarded to the batch kernel. Default is 0. It is not
        used when `x2` is given.

    Returns
    -------
    torch.Tensor
        Whatever the selected kernel returns: a Mutual Information value for
        the pairwise form or a matrix for the batch form.

    Raises
    ------
    ValueError
        Propagated from the selected kernel when its inputs are invalid.
    """
    # A second tensor selects the pairwise form; `dim` only matters for batches.
    if x2 is not None:
        return instance_mutual_information_kernel(x1=x, x2=x2)
    return batch_mutual_information_kernel(x=x, dim=dim)

Computes the Mutual Information matrix for a batch of inputs.

Parameters:

Name	Type	Description	Default
`x`	`Tensor`	Input tensor of shape (n_samples, n_features).	required
`dim`	`int`	Dimension along which information is computed. Default is 0.	`0`

Returns:

Type	Description
`Tensor`	Mutual Information matrix.

Raises:

Type	Description
`ValueError`	If input tensor is invalid or dimensions are incorrect.

Source code in tinybig/koala/statistics/kernel.py

def batch_mutual_information_kernel(x: torch.Tensor, dim: int = 0):
    """
    Computes the Mutual Information matrix for a batch of inputs.

    For every pair of distinct columns the entry is
    ``0.5 * log(var_i * var_j / det(C_ij))``, where ``C_ij`` is the 2x2
    sample covariance matrix of the two columns. Both variances and the
    determinant are clamped from below at ``1e-10`` before the logarithm.
    The diagonal is left at 0.

    Parameters
    ----------
    x : torch.Tensor
        2D input tensor. Rows are observations and columns are variables
        when ``dim == 0``; the roles are swapped when ``dim == 1``.
    dim : int, optional
        0 to compare columns, 1 to compare rows (the tensor is transposed
        first). Default is 0.

    Returns
    -------
    torch.Tensor
        Symmetric (m, m) Mutual Information matrix with the same dtype and
        device as `x`.

    Raises
    ------
    ValueError
        If `x` is None or empty, is not 2D, or `dim` is not 0 or 1.
    """
    if x is None or x.numel() == 0:
        raise ValueError("Input tensors must not be None or empty")
    if x.ndim != 2:
        raise ValueError('Input must be a 2D tensor for batch operation.')
    if dim not in [0, 1]:
        raise ValueError('dim must be 0 or 1')

    if dim == 1:
        x = x.T
    m = x.shape[1]

    # Lower bound that keeps the ratio and the logarithm finite.
    epsilon = 1e-10

    # Per-column variances do not depend on the pair, so compute them once.
    variances = torch.var(x, dim=0, unbiased=True).clamp(min=epsilon)

    # Allocate the result like `x` so float64 / non-CPU inputs are not
    # silently converted to a default-dtype CPU tensor.
    mi_matrix = torch.zeros(m, m, dtype=x.dtype, device=x.device)

    # Only the upper triangle is computed; the matrix is mirrored on assignment.
    for i in range(m):
        for j in range(i + 1, m):
            # Joint 2x2 covariance of the two columns (rows of the stack are variables).
            cov_joint = torch.cov(torch.stack((x[:, i], x[:, j]), dim=0))
            det_cov_joint = torch.linalg.det(cov_joint).clamp(min=epsilon)

            # Mutual information calculation
            mi_value = 0.5 * torch.log(variances[i] * variances[j] / det_cov_joint)
            mi_matrix[i, j] = mi_value
            mi_matrix[j, i] = mi_value  # Symmetric

    return mi_matrix

Combines multiple kernel functions into a custom hybrid kernel.

Parameters:

Name	Type	Description	Default
`x`	`Tensor`	First input tensor.	required
`x2`	`Tensor`	Second input tensor for pairwise kernels.	`None`
`kernels`	`list of callables`	Kernel functions to combine.	`None`
`weights`	`list, tuple, or float`	Weights for combining the kernel functions.	`None`
`dim`	`int`	Dimension for applying the kernels. Default is 0.	`0`

Returns:

Type	Description
`Tensor`	Combined hybrid kernel output.

Raises:

Type	Description
`ValueError`	If the number of kernels and weights do not match or inputs are invalid.

Source code in tinybig/koala/statistics/kernel.py

def custom_hybrid_kernel(x: torch.Tensor, x2: torch.Tensor = None, kernels: List[Callable[[torch.Tensor, torch.Tensor], torch.Tensor]] = None, weights: Union[List, Tuple, float] = None, dim: int = 0):
    """
    Dispatch to the batch or the pairwise custom hybrid kernel.

    Parameters
    ----------
    x : torch.Tensor
        First input tensor.
    x2 : torch.Tensor, optional
        Second input tensor for pairwise kernels. When omitted (None), the
        batch hybrid kernel is applied to `x` alone.
    kernels : list of callables
        Kernel functions to combine; forwarded unchanged.
    weights : list, tuple, or float
        Weights for combining the kernel functions; forwarded unchanged.
    dim : int, optional
        Dimension forwarded to the batch hybrid kernel. Default is 0. It is
        not used when `x2` is given.

    Returns
    -------
    torch.Tensor
        Combined hybrid kernel output of the selected implementation.

    Raises
    ------
    ValueError
        Propagated from the selected kernel when its inputs are invalid.
    """
    # A second tensor selects the pairwise form; `dim` only matters for batches.
    if x2 is not None:
        return instance_custom_hybrid_kernel(x1=x, x2=x2, kernels=kernels, weights=weights)
    return batch_custom_hybrid_kernel(x=x, kernels=kernels, weights=weights, dim=dim)

Combines multiple kernel functions to compute a hybrid kernel matrix for a batch of 2D tensors.

Parameters:

Name	Type	Description	Default
`x`	`Tensor`	The input tensor, must be 2D with shape (n_samples, n_features).	required
`kernels`	`list of callable`	A list of kernel functions to combine.	required
`weights`	`list, tuple, or float`	Weights for combining the kernel functions. If None, equal weights are assigned to all kernels.	`None`
`dim`	`int`	The dimension for applying the kernels. Must be 0 or 1. Default is 0.	`0`

Returns:

Type	Description
`Tensor`	The combined hybrid kernel matrix.

Raises:

Type	Description
`ValueError`	If the input tensor is None, empty, or not 2D. If `dim` is not 0 or 1. If the number of kernels and weights do not match. If kernel outputs have inconsistent shapes.

Source code in tinybig/koala/statistics/kernel.py

def batch_custom_hybrid_kernel(x: torch.Tensor, kernels: List[Callable[[torch.Tensor, torch.Tensor], torch.Tensor]], weights: Union[List, Tuple, float] = None, dim: int = 0):
    """
    Combines multiple kernel functions into a weighted sum of their outputs on a 2D tensor.

    Every kernel is called as ``kernel(x)`` and the outputs, which must all
    share one shape, are summed with the given weights.

    Parameters
    ----------
    x : torch.Tensor
        The input tensor, must be 2D and non-empty.
    kernels : callable, or list/tuple of callables
        Kernel functions to combine. A single callable is treated as a
        one-element list.
    weights : list, tuple, or float, optional
        Weights for combining the kernel functions. A single number is
        treated as a one-element list. If None, equal weights
        ``1 / len(kernels)`` are assigned to all kernels.
    dim : int, optional
        Must be 0 or 1. Default is 0.
        NOTE(review): the value is validated but not otherwise used here -
        the kernels receive `x` untransposed. Confirm whether ``dim == 1``
        is meant to transpose `x` as the other batch kernels do.

    Returns
    -------
    torch.Tensor
        The weighted sum of the kernel outputs.

    Raises
    ------
    ValueError
        If the input tensor is None, empty, or not 2D.
        If `dim` is not 0 or 1.
        If no kernel is provided.
        If the number of kernels and weights do not match.
        If kernel outputs have inconsistent shapes.
    """
    if x is None or x.numel() == 0:
        raise ValueError("Input tensors must not be None or empty")
    if x.ndim != 2:
        raise ValueError('x must be of dimension 2...')
    if dim not in [0, 1]:
        raise ValueError('dim must be 0 or 1')

    if kernels is None:
        raise ValueError("At least one kernel function must be provided.")

    # Normalise before measuring the length: a bare callable has no len(),
    # and a tuple of kernels must be unpacked rather than wrapped as one item.
    kernels = list(kernels) if isinstance(kernels, (list, tuple)) else [kernels]
    if not kernels:
        raise ValueError("At least one kernel function must be provided.")

    if weights is None:
        weights = [1 / len(kernels)] * len(kernels)
    elif isinstance(weights, (list, tuple)):
        weights = list(weights)
    else:
        # A single scalar weight.
        weights = [weights]

    if len(kernels) != len(weights):
        raise ValueError("The number of kernels must match the number of weights.")

    kernel_outputs = [kernel(x) for kernel in kernels]

    # A weighted sum is only meaningful when every kernel yields the same shape.
    if len({output.shape for output in kernel_outputs}) != 1:
        raise ValueError("All kernel outputs must have the same shape.")

    weighted_sum = sum(weight * output for weight, output in zip(weights, kernel_outputs))
    return weighted_sum