Merge pull request #179 from joscao/devel/util_linear_algebra

Provide linear algebra utility
ecmwf-ifs · Nov 9, 2023 · ffe94af · ffe94af
2 parents df3f99a + 1754f10
commit ffe94af
Show file tree

Hide file tree

Showing 2 changed files with 398 additions and 0 deletions.
diff --git a/loki/analyse/util_linear_algebra.py b/loki/analyse/util_linear_algebra.py
@@ -0,0 +1,210 @@
+# (C) Copyright 2018- ECMWF.
+# This software is licensed under the terms of the Apache Licence Version 2.0
+# which can be obtained at http://www.apache.org/licenses/LICENSE-2.0.
+# In applying this licence, ECMWF does not waive the privileges and immunities
+# granted to it by virtue of its status as an intergovernmental organisation
+# nor does it submit to any jurisdiction.
+
+import numpy as np
+
+# Names exported by ``from loki.analyse.util_linear_algebra import *``.
+__all__ = [
+    "back_substitution",
+    "generate_row_echelon_form",
+    "is_independent_system",
+    "yield_one_d_systems",
+]
+
+
+def is_independent_system(matrix):
+    """
+    Tell whether every row of a coefficient matrix holds at most one non-zero entry.
+
+    Parameters
+    ----------
+    matrix : numpy.ndarray
+        A two-dimensional (rectangular) matrix of coefficients.
+
+    Returns
+    -------
+    bool
+        True if no row of ``matrix`` contains more than one non-zero coefficient, False otherwise.
+
+    Notes
+    -----
+    For a linear system written as `matrix [operator] right_hand_side`, a row with zero or exactly one
+    non-zero coefficient is an equation that involves at most a single unknown. If this holds for all
+    rows, the system can be treated as a set of independent one-dimensional problems, which is what
+    `yield_one_d_systems` assumes without checking.
+    """
+    # number of non-zero coefficients in each row
+    non_zero_per_row = np.sum(matrix != 0, axis=1)
+
+    return np.all(non_zero_per_row <= 1)
+
+
+def yield_one_d_systems(matrix, right_hand_side):
+    """
+    Split a linear system of equations (<=, >=, or ==) column by column into one-dimensional problems.
+
+    Parameters
+    ----------
+    matrix : numpy.ndarray
+        A rectangular matrix representing coefficients.
+    right_hand_side : numpy.ndarray
+        The right-hand side, indexed along its first axis by the rows of ``matrix``.
+
+    Yields
+    ------
+    tuple[numpy.ndarray, numpy.ndarray]
+        A coefficient column vector of shape ``(k, 1)`` and the matching right-hand side entries.
+
+    Notes
+    -----
+    The independence of the problems is NOT checked; call `is_independent_system` first if unsure.
+
+    The system `matrix [operator] right_hand_side` is processed in two passes:
+
+    1. Rows of ``matrix`` that consist only of zeros. If there are any, one pair is yielded per column
+       of ``matrix``: the (all zero) column restricted to those rows, together with the right-hand
+       side entries of those rows.
+    2. All remaining rows. If there are any, one pair is yielded per column of ``matrix``: the non-zero
+       entries of the column, together with the right-hand side entries of the rows they come from.
+       A column without non-zero entries in these rows yields an empty pair.
+
+    Example
+    -------
+    ```python
+    for A, b in yield_one_d_systems(matrix, right_hand_side):
+        # Solve the one-dimensional problem A * x = b
+        solution = solve_one_d_system(A, b)
+    ```
+    """
+    zero_rows = np.all(matrix == 0, axis=1)
+
+    # first pass: equations with an empty left hand side but an existing right hand side
+    if right_hand_side[zero_rows].size != 0:
+        for column in matrix[zero_rows].T:
+            yield column.reshape((-1, 1)), right_hand_side[zero_rows]
+
+    # second pass: only the equations that carry at least one coefficient
+    non_zero_rows = ~zero_rows
+    remaining_matrix = matrix[non_zero_rows]
+    remaining_rhs = right_hand_side[non_zero_rows]
+
+    if remaining_rhs.size == 0:
+        return
+
+    for column in remaining_matrix.T:
+        selected = column != 0
+        yield column[selected].reshape((-1, 1)), remaining_rhs[selected]
+
+
+def back_substitution(
+    upper_triangular_square_matrix,
+    right_hand_side,
+    divison_operation=lambda x, y: x / y,
+):
+    """
+    Solve a linear system of equations using back substitution for an upper triangular square matrix.
+
+    Parameters
+    ----------
+    upper_triangular_square_matrix : numpy.ndarray
+        An upper triangular square matrix (R).
+
+    right_hand_side : numpy.ndarray
+        A vector (y) on the right-hand side of the equation Rx = y.
+
+    divison_operation : function, optional
+        A custom division operation function taking ``(numerator, denominator)``.
+        Default is standard division (/). Note the (historical) spelling of the parameter name.
+
+    Returns
+    -------
+    numpy.ndarray
+        The solution vector (x) to the system of equations Rx = y. It has the shape and dtype
+        of ``right_hand_side``. For an empty ``right_hand_side`` the empty solution is returned.
+
+    Raises
+    ------
+    ValueError
+        If the lower right element of the upper_triangular_square_matrix (R) is zero.
+
+    Notes
+    -----
+    The function performs back substitution to find the solution vector x for the equation Rx = y,
+    where R is an upper triangular square matrix and y is a vector. The divison_operation
+    function is used for every division (e.g., to enforce integer arithmetic with ``//``).
+
+    Only the lower right element of R is checked to be nonzero; all other diagonal elements are
+    handed to divison_operation as they are.
+
+    The solution is stored in an array created with ``numpy.zeros_like(right_hand_side)``, so every
+    computed entry is cast to the dtype of ``right_hand_side``. Pass a floating point right-hand side
+    if fractional results have to be preserved.
+    """
+    R = upper_triangular_square_matrix
+    y = right_hand_side
+
+    x = np.zeros_like(y)
+
+    # an empty system has the empty solution; indexing R[-1, -1] below would fail
+    if len(y) == 0:
+        return x
+
+    # explicit check instead of an assert, which would be stripped when running with "python -O"
+    if R[-1, -1] == 0:
+        raise ValueError(
+            "back substitution requires a nonzero lower right element of the upper triangular matrix"
+        )
+
+    # the last equation contains a single unknown
+    x[-1] = divison_operation(y[-1], R[-1, -1])
+
+    # walk upwards: substitute the already known unknowns, then divide by the diagonal element
+    for i in range(len(y) - 2, -1, -1):
+        x[i] = divison_operation((y[i] - np.dot(R[i, i + 1 :], x[i + 1 :])), R[i, i])
+
+    return x
+
+
+def generate_row_echelon_form(
+    A, conditional_check=lambda A: None, division_operator=lambda x, y: x / y
+):
+    """
+    Calculate the Row Echelon Form (REF) of a matrix.
+
+    Parameters
+    ----------
+    A : numpy.ndarray
+        The two-dimensional input matrix for which the REF is to be calculated. It is not modified.
+    conditional_check : function, optional
+        A custom function to check conditions during the computation. For every pivot it is called
+        with the not yet reduced trailing sub-matrix whose first row is the pivot row (after the row
+        swap, before the pivot row is divided). It may raise to abort the computation.
+    division_operator : function, optional
+        A custom division operation function taking ``(row, pivot_element)``.
+        Default is standard division (/).
+
+    Returns
+    -------
+    numpy.ndarray
+        The REF of the input matrix A, as a new array with the dtype of A.
+
+    Notes
+    -----
+    - If the input matrix has no rows or columns, it is already in REF, and a copy of it is returned.
+    - The function utilizes the specified division operation (default is standard division) for division.
+    - All intermediate results are stored in an array with the dtype of A. For an integer matrix the
+      result of the division is therefore cast back to integers; use a floating point matrix if
+      fractional entries have to be preserved.
+    - The reduction is done iteratively on a copy of A, so neither the recursion limit nor the caller's
+      data is affected.
+
+    Reference
+    ---------
+    https://math.stackexchange.com/a/3073117
+    for question:
+    https://math.stackexchange.com/questions/3073083/how-to-reduce-matrix-into-row-echelon-form-in-numpy
+    """
+    # work on a copy so that row swaps and eliminations never leak into the caller's matrix
+    ref = A.copy()
+    n_rows, n_cols = ref.shape
+
+    row = col = 0
+    while row < n_rows and col < n_cols:
+        # trailing part that is not reduced yet; this is a view, so all edits end up in ref
+        block = ref[row:, col:]
+
+        # we search for non-zero elements in the first column of the trailing part
+        pivot_candidates = np.flatnonzero(block[:, 0] != 0)
+        if pivot_candidates.size == 0:
+            # the column is already zero below the current row, continue with the next column
+            col += 1
+            continue
+
+        # if the first non-zero element is not in the first row, we switch rows
+        pivot = pivot_candidates[0]
+        if pivot > 0:
+            block[[pivot, 0]] = block[[0, pivot]]
+
+        # check condition
+        conditional_check(block)
+
+        # we divide the first row by its first element
+        block[0] = division_operator(block[0], block[0, 0])
+        # we subtract from all subsequent rows the first row (its first element is 1 now for the
+        # default division) multiplied by the corresponding element in the first column
+        block[1:] -= block[0] * block[1:, 0:1]
+
+        # continue with the matrix from the next row, from the next column
+        row += 1
+        col += 1
+
+    return ref
diff --git a/tests/test_util_linear_algebra.py b/tests/test_util_linear_algebra.py
@@ -0,0 +1,188 @@
+# (C) Copyright 2018- ECMWF.
+# This software is licensed under the terms of the Apache Licence Version 2.0
+# which can be obtained at http://www.apache.org/licenses/LICENSE-2.0.
+# In applying this licence, ECMWF does not waive the privileges and immunities
+# granted to it by virtue of its status as an intergovernmental organisation
+# nor does it submit to any jurisdiction.
+from math import gcd as math_gcd
+import pytest
+import numpy as np
+
+try:
+    # probe whether math.gcd accepts more than two arguments
+    _ = math_gcd(4, 3, 2)
+except TypeError:
+    # Python 3.8 can only handle two arguments, so fold the two-argument gcd over all inputs
+    from functools import reduce
+
+    def gcd(*args):
+        """Return the greatest common divisor of all given integers."""
+        return reduce(math_gcd, args)
+else:
+    gcd = math_gcd
+
+from loki.analyse.util_linear_algebra import (
+    back_substitution,
+    generate_row_echelon_form,
+    is_independent_system,
+    yield_one_d_systems,
+)
+
+
+@pytest.mark.parametrize(
+    "upper_triangular_square_matrix, right_hand_side, expected, divison_operation",
+    [
+        (
+            [[2, 1, -1], [0, 0.5, 0.5], [0, 0, -1]],
+            [[8], [1], [1]],
+            [[2], [3], [-1]],
+            lambda x, y: x / y,
+        ),
+        (
+            [[2, 0], [0, 1]],
+            [[10], [11]],
+            [[5], [11]],
+            lambda x, y: x // y,
+        ),
+    ],
+)
+def test_backsubstitution(
+    upper_triangular_square_matrix, right_hand_side, expected, divison_operation
+):
+    """Solve small upper triangular systems with true division and with floor division."""
+    R = np.array(upper_triangular_square_matrix)
+    y = np.array(right_hand_side)
+
+    solution = back_substitution(R, y, divison_operation)
+
+    assert np.allclose(solution, np.array(expected))
+
+
+@pytest.mark.parametrize(
+    "matrix, result",
+    [
+        ([[2, 0, 1], [0, 2, 0]], [[1, 0, 0.5], [0, 1, 0]]),
+        ([[1, -2, 1, 0], [3, 2, 1, 5]], [[1, -2, 1, 0], [0, 1, -0.25, 0.625]]),
+        ([[1, -1, -10]], [[1, -1, -10]]),
+        ([[0, 0, 0], [0, 0, 0], [0, 0, 0]], [[0, 0, 0], [0, 0, 0], [0, 0, 0]]),
+        ([[1, 2, 3], [4, 5, 6], [7, 8, 9]], [[1, 2, 3], [0, 1, 2], [0, 0, 0]]),
+        ([[0, 1, 0], [0, 0, 1], [0, 0, 0]], [[0, 1, 0], [0, 0, 1], [0, 0, 0]]),
+        (
+            [[2, 4, 6, 8], [1, 2, 3, 4], [3, 6, 9, 12]],
+            [[1, 2, 3, 4], [0, 0, 0, 0], [0, 0, 0, 0]],
+        ),
+        ([[0, 0, 0], [1, 0, 2]], [[1, 0, 2], [0, 0, 0]]),
+    ],
+)
+def test_generate_row_echelon_form(matrix, result):
+    """Compare the row echelon form of floating point matrices with the expected reduction."""
+    echelon_form = generate_row_echelon_form(np.array(matrix, dtype=float))
+    expected = np.array(result, dtype=float)
+
+    assert np.allclose(echelon_form, expected)
+
+
+@pytest.mark.parametrize(
+    "matrix, result",
+    [
+        ([[]], [[]]),
+        ([[2, 0, 1], [0, 2, 0]], [[1, 0, 0], [0, 1, 0]]),
+        ([[1, -2, 1, 0], [3, 2, 1, 5]], [[1, -2, 1, 0], [0, 1, -1, 0]]),
+        ([[1, -1, -10]], [[1, -1, -10]]),
+        ([[0, 0, 0], [0, 0, 0], [0, 0, 0]], [[0, 0, 0], [0, 0, 0], [0, 0, 0]]),
+        ([[1, 2, 3], [4, 5, 6], [7, 8, 9]], [[1, 2, 3], [0, 1, 2], [0, 0, 0]]),
+        ([[0, 1, 0], [0, 0, 1], [0, 0, 0]], [[0, 1, 0], [0, 0, 1], [0, 0, 0]]),
+        (
+            [[2, 4, 6, 8], [1, 2, 3, 4], [3, 6, 9, 12]],
+            [[1, 2, 3, 4], [0, 0, 0, 0], [0, 0, 0, 0]],
+        ),
+    ],
+)
+def test_enforce_integer_arithmetics_for_row_echelon_form(matrix, result):
+    """Check the row echelon form when floor division replaces the default true division."""
+    expected = np.array(result, dtype=float)
+
+    echelon_form = generate_row_echelon_form(
+        np.array(matrix, dtype=float), division_operator=lambda x, y: x // y
+    )
+
+    assert np.allclose(echelon_form, expected)
+
+
+def _raise_assertion_error(A):
+    """Condition callback that always fails; despite its name it raises ValueError, ignoring ``A``."""
+    raise ValueError()
+
+
+def _require_gcd_condition(A):
+    """
+    Check that gcd condition of linear Diophantine equation is satisfied
+
+    Raises ValueError if the last entry of the first row of ``A`` is not divisible by the
+    greatest common divisor of all other entries of that row.
+    """
+    right_hand_side = A[0, -1]
+    common_divisor = gcd(*A[0, :-1])
+
+    if right_hand_side % common_divisor != 0:
+        raise ValueError()
+
+
+@pytest.mark.parametrize(
+    "matrix, condition, result",
+    [
+        ([[1, 2, 3], [4, 5, 6]], _raise_assertion_error, None),
+        (
+            [[2, 0, 0, -2, -20], [0, 2, -2, 0, -22]],
+            _require_gcd_condition,
+            [[1, 0, 0, -1, -10], [0, 1, -1, 0, -11]],
+        ),
+        ([[2, 0, 0, -2, -20], [0, 2, -2, 0, -21]], _require_gcd_condition, None),
+    ],
+)
+def test_require_conditions(matrix, condition, result):
+    """A ``result`` of None marks cases in which the condition callback has to raise ValueError."""
+    matrix = np.array(matrix)
+
+    if result is not None:
+        echelon_form = generate_row_echelon_form(matrix, conditional_check=condition)
+        assert np.allclose(echelon_form, np.array(result))
+        return
+
+    with pytest.raises(ValueError):
+        generate_row_echelon_form(matrix, conditional_check=condition)
+
+
+@pytest.mark.parametrize(
+    "matrix, expected_result",
+    [
+        (np.array([[1, 0], [0, 1], [0, 0]]), True),
+        (np.array([[1, 0, 0], [0, 1, 0], [0, 0, 1]]), True),
+        (np.array([[1, 0, 1], [0, 1, 0], [0, 0, 0]]), False),
+        (np.array([[0, 0, 0], [0, 0, 0], [0, 0, 0]]), True),
+        (np.array([[1, 0, 0], [0, 0, 1], [0, 1, 0]]), True),
+    ],
+)
+def test_is_independent_system(matrix, expected_result):
+    """Matrices with at most one non-zero entry per row count as independent systems."""
+    is_independent = is_independent_system(matrix)
+
+    assert is_independent == expected_result
+
+
+@pytest.mark.parametrize(
+    "matrix, rhs, list_of_lhs_column, list_of_rhs_column",
+    [
+        (
+            np.array([[1, 0], [0, 1], [0, 0]]),
+            np.array([[1], [2], [0]]),
+            [np.array([[0]]), np.array([[0]]), np.array([[1]]), np.array([[1]])],
+            [np.array([[0]]), np.array([[0]]), np.array([[1]]), np.array([[2]])],
+        ),
+        (
+            np.array([[1, 0], [0, 1], [0, 0]]),
+            np.array([[1], [2], [1]]),
+            [np.array([[0]]), np.array([[0]]), np.array([[1]]), np.array([[1]])],
+            [np.array([[1]]), np.array([[1]]), np.array([[1]]), np.array([[2]])],
+        ),
+        (
+            np.array([[0, 0, 0], [0, 0, 0], [0, 0, 0]]),
+            np.array([[1], [2], [3]]),
+            [np.array([[0], [0], [0]])] * 3,
+            [np.array([[1], [2], [3]])] * 3,
+        ),
+        (  # will even split non independent systems, call is_independent_system before
+            np.array([[2, 1], [1, 3]]),
+            np.array([[3], [4]]),
+            [np.array([[2], [1]]), np.array([[1], [3]])],
+            [np.array([[3], [4]]), np.array([[3], [4]])],
+        ),
+    ],
+)
+def test_yield_one_d_systems(matrix, rhs, list_of_lhs_column, list_of_rhs_column):
+    """Compare every yielded (coefficients, right-hand side) pair with the expected columns, in order."""
+    systems = list(yield_one_d_systems(matrix, rhs))
+
+    # equal lengths make the pairwise comparison below exhaustive
+    assert len(systems) == len(list_of_lhs_column) == len(list_of_rhs_column)
+
+    for (A, b), expected_lhs, expected_rhs in zip(
+        systems, list_of_lhs_column, list_of_rhs_column
+    ):
+        assert np.array_equal(A, expected_lhs)
+        assert np.array_equal(b, expected_rhs)