Merge pull request #6 from jcapriot/transpose_solve

jcapriot · web-flow · commit 8a92a132d10b · 2023-11-14T11:35:15.000-08:00
add transpose option to solve call
diff --git a/pydiso/mkl_solver.pyx b/pydiso/mkl_solver.pyx
@@ -336,7 +336,7 @@ cdef class MKLPardisoSolver:
     def __call__(self, b):
         return self.solve(b)
 
-    def solve(self, b, x=None):
+    def solve(self, b, x=None, transpose=False):
         """solve(self, b, x=None, transpose=False)
         Solves the equation AX=B using the factored A matrix
 
@@ -354,6 +354,8 @@ cdef class MKLPardisoSolver:
         x : numpy.ndarray, optional
             A pre-allocated output array (of the same data type as A).
             If None, a new array is constructed.
+        transpose : bool, optional
+            If True, solve A^T X = B (plain transpose, not conjugate transpose) using the factored A matrix. Default is False.
 
         Returns
         -------
@@ -388,6 +390,10 @@ cdef class MKLPardisoSolver:
 
         cdef int_t nrhs = b.shape[1] if b.ndim == 2 else 1
 
+        if transpose:
+            self.set_iparm(11, 2)
+        else:
+            self.set_iparm(11, 0)
         self._solve(bp, xp, nrhs)
         return x
 
@@ -420,7 +426,7 @@ cdef class MKLPardisoSolver:
         if self._is_32:
             self._par.iparm[i] = val
         else:
-            self._par.iparm[i] = val
+            self._par64.iparm[i] = val
 
     @property
     def nnz(self):
diff --git a/setup.py b/setup.py
@@ -24,7 +24,7 @@ def configuration(parent_package="", top_path=None):
     python_requires=">=3.8",
     setup_requires=[
         "numpy>=1.8",
-        "cython>=3.0",
+        "cython>=0.29.31",
     ],
     install_requires=[
         'numpy>=1.8',
diff --git a/tests/test_pydiso.py b/tests/test_pydiso.py
@@ -9,6 +9,7 @@
     set_mkl_pardiso_threads,
 )
 import pytest
+import sys
 
 np.random.seed(12345)
 n = 40
@@ -39,6 +40,7 @@
                   }
 
 
+@pytest.mark.xfail(sys.platform == "darwin", reason="Unexpected Thread bug in third party library")
 def test_thread_setting():
     n1 = get_mkl_max_threads()
     n2 = get_mkl_pardiso_max_threads()
@@ -93,8 +95,22 @@ def test_solver(A, matrix_type):
     x2 = solver.solve(b)
 
     eps = np.finfo(dtype).eps
-    rel_err = np.linalg.norm(x-x2)/np.linalg.norm(x)
-    assert rel_err < 1E3*eps
+    np.testing.assert_allclose(x, x2, atol=1E3*eps)
+
+@pytest.mark.parametrize("A, matrix_type", inputs)
+def test_transpose_solver(A, matrix_type):
+    dtype = A.dtype
+    if np.issubdtype(dtype, np.complexfloating):
+        x = xc.astype(dtype)
+    else:
+        x = xr.astype(dtype)
+    b = A.T @ x
+
+    solver = Solver(A, matrix_type=matrix_type)
+    x2 = solver.solve(b, transpose=True)
+
+    eps = np.finfo(dtype).eps
+    np.testing.assert_allclose(x, x2, atol=1E3*eps)
 
 def test_multiple_RHS():
     A = A_real_dict["real_symmetric_positive_definite"]
@@ -105,8 +121,7 @@ def test_multiple_RHS():
     x2 = solver.solve(b)
 
     eps = np.finfo(np.float64).eps
-    rel_err = np.linalg.norm(x-x2)/np.linalg.norm(x)
-    assert rel_err < 1E3*eps
+    np.testing.assert_allclose(x, x2, atol=1E3*eps)
 
 
 def test_matrix_type_errors():
@@ -119,6 +134,7 @@ def test_matrix_type_errors():
         solver = Solver(A, matrix_type="real_symmetric_positive_definite")
 
 
+
 def test_rhs_size_error():
     A = A_real_dict["real_symmetric_positive_definite"]
     solver = Solver(A, "real_symmetric_positive_definite")