Source code for nerva_numpy.matrix_operations

# Copyright 2023 Wieger Wesselink.
# Distributed under the Boost Software License, Version 1.0.
# (See accompanying file LICENSE or http://www.boost.org/LICENSE_1_0.txt)

"""Matrix operations built on top of torch to support the math in the library.

The functions here intentionally mirror the names in the accompanying docs.
They operate on 1D/2D tensors and keep broadcasting explicit for clarity.
"""

import numpy as np

Matrix = np.ndarray


# A constant used by inv_sqrt to avoid division by zero
epsilon = 1e-7


[docs] def is_vector(x: Matrix) -> bool: """Check if x is a 1D tensor.""" return len(x.shape) == 1
[docs] def is_column_vector(x: Matrix) -> bool: """Check if x can be treated as a column vector.""" return is_vector(x) or x.shape[1] == 1
[docs] def is_row_vector(x: Matrix) -> bool: """Check if x can be treated as a row vector.""" return is_vector(x) or x.shape[0] == 1
[docs] def vector_size(x: Matrix) -> int: """Get size along first dimension.""" return x.shape[0]
[docs] def is_square(X: Matrix) -> bool: """Check if X is a square matrix.""" m, n = X.shape return m == n
[docs] def dot(x: Matrix, y: Matrix): """Dot product of vectors x and y.""" return np.dot(np.squeeze(x), np.squeeze(y))
[docs] def zeros(m: int, n=None) -> Matrix: """ Returns an mxn matrix with all elements equal to 0. """ return np.zeros((m, n)) if n else np.zeros(m)
[docs] def ones(m: int, n=None) -> Matrix: """ Returns an mxn matrix with all elements equal to 1. """ return np.ones((m, n)) if n else np.ones(m)
[docs] def identity(n: int) -> Matrix: """ Returns the nxn identity matrix. """ return np.eye(n)
[docs] def product(X: Matrix, Y: Matrix) -> Matrix: """Matrix multiplication X @ Y.""" return X @ Y
[docs] def hadamard(X: Matrix, Y: Matrix) -> Matrix: """Element-wise product X ⊙ Y.""" return X * Y
[docs] def diag(X: Matrix) -> Matrix: """Extract diagonal of X as a vector.""" return np.diag(X)
[docs] def Diag(x: Matrix) -> Matrix: """Create diagonal matrix with x as diagonal.""" return np.diagflat(x)
[docs] def elements_sum(X: Matrix): """ Returns the sum of the elements of X. """ return np.sum(X)
[docs] def column_repeat(x: Matrix, n: int) -> Matrix: """Repeat column vector x horizontally n times.""" assert is_column_vector(x) if len(x.shape) == 1: x = x[:, np.newaxis] return np.tile(x, (1, n))
[docs] def row_repeat(x: Matrix, m: int) -> Matrix: """Repeat row vector x vertically m times.""" assert is_row_vector(x) if len(x.shape) == 1: x = x[np.newaxis, :] return np.tile(x, (m, 1))
[docs] def columns_sum(X: Matrix) -> Matrix: """Sum over columns (returns row vector).""" return np.sum(X, axis=0)
[docs] def rows_sum(X: Matrix) -> Matrix: """Sum over rows (returns column vector).""" return np.sum(X, axis=1)
[docs] def columns_max(X: Matrix) -> Matrix: """ Returns a column vector with the maximum values of each row in X. """ return np.max(X, axis=0)
[docs] def rows_max(X: Matrix) -> Matrix: """ Returns a row vector with the maximum values of each column in X. """ return np.max(X, axis=1)
[docs] def columns_mean(X: Matrix) -> Matrix: """ Returns a column vector with the mean values of each row in X. """ return np.mean(X, axis=0)
[docs] def rows_mean(X: Matrix) -> Matrix: """ Returns a row vector with the mean values of each column in X. """ return np.mean(X, axis=1)
[docs] def apply(f, X: Matrix) -> Matrix: """Element-wise application of function f to X.""" return f(X)
[docs] def exp(X: Matrix) -> Matrix: """Element-wise exponential exp(X).""" return np.exp(X)
[docs] def log(X: Matrix) -> Matrix: """Element-wise natural logarithm log(X).""" return np.log(X)
[docs] def reciprocal(X: Matrix) -> Matrix: """Element-wise reciprocal 1/X.""" return 1 / X
[docs] def square(X: Matrix) -> Matrix: """Element-wise square X².""" return np.square(X)
[docs] def sqrt(X: Matrix) -> Matrix: """Element-wise square root √X.""" return np.sqrt(X)
[docs] def inv_sqrt(X: Matrix) -> Matrix: """Element-wise inverse square root X^(-1/2) with epsilon for stability.""" return 1 / np.sqrt(X + epsilon) # The epsilon is needed for numerical stability
[docs] def log_sigmoid(X: Matrix) -> Matrix: """Element-wise log(sigmoid(X)) computed stably.""" return -np.logaddexp(0, -X)