Skip to content

Commit

Permalink
Merge pull request #115 from worc4021/feature/ma27
Browse files Browse the repository at this point in the history
MA27 interface
  • Loading branch information
cvanaret authored Nov 30, 2024
2 parents e10b16e + 27af512 commit 9fb6506
Show file tree
Hide file tree
Showing 5 changed files with 499 additions and 5 deletions.
15 changes: 14 additions & 1 deletion CMakeLists.txt
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
# Copyright (c) 2018-2024 Charlie Vanaret
# Copyright (c) 2018-2024 Charlie Vanaret
# Licensed under the MIT license. See LICENSE file in the project directory for details.

cmake_minimum_required(VERSION 3.7)
Expand Down Expand Up @@ -107,6 +107,12 @@ else()
else()
message(WARNING "Optional library MA57 was not found.")
endif()
find_library(MA27 ma27)
if(MA27)
link_to_uno(ma27 ${MA27})
else()
message(WARNING "Optional library MA27 was not found.")
endif()
endif()
if(HSL OR MA57)
list(APPEND UNO_SOURCE_FILES uno/solvers/MA57/MA57Solver.cpp)
Expand All @@ -115,6 +121,13 @@ if(HSL OR MA57)
find_package(BLAS REQUIRED)
list(APPEND LIBRARIES ${BLAS_LIBRARIES})
endif()
if(HSL OR MA27)
list(APPEND UNO_SOURCE_FILES uno/solvers/MA27/MA27Solver.cpp)
list(APPEND TESTS_UNO_SOURCE_FILES unotest/functional_tests/MA27SolverTests.cpp)

find_package(BLAS REQUIRED)
list(APPEND LIBRARIES ${BLAS_LIBRARIES})
endif()

# METIS
find_library(METIS metis)
Expand Down
318 changes: 318 additions & 0 deletions uno/solvers/MA27/MA27Solver.cpp
Original file line number Diff line number Diff line change
@@ -0,0 +1,318 @@
// Copyright (c) 2024 Manuel Schaich
// Licensed under the MIT license. See LICENSE file in the project directory for details.

#include <cassert>
#include "MA27Solver.hpp"
#include "linear_algebra/SymmetricMatrix.hpp"
#include "linear_algebra/Vector.hpp"
#include "tools/Logger.hpp"
#include "fortran_interface.h"

#define MA27ID FC_GLOBAL(ma27id, MA27ID)
#define MA27AD FC_GLOBAL(ma27ad, MA27AD)
#define MA27BD FC_GLOBAL(ma27bd, MA27BD)
#define MA27CD FC_GLOBAL(ma27cd, MA27CD)

extern "C"
{
void MA27ID(int ICNTL[], double CNTL[]);

void MA27AD(int *N, int *NZ, int IRN[], int ICN[], int IW[], int *LIW, int IKEEP[], int IW1[],
int *NSTEPS, int *IFLAG, int ICNTL[], double CNTL[], int INFO[], double *OPS);

void MA27BD(int *N, int *NZ, int IRN[], int ICN[], double A[], int *LA, int IW[], int *LIW,
int IKEEP[], int *NSTEPS, int *MAXFRT, int IW1[], int ICNTL[], double CNTL[], int INFO[]);

void MA27CD(int *N, double A[], int *LA, int IW[], int *LIW, double W[], int *MAXFRT, double RHS[],
int IW1[], int *NSTEPS, int ICNTL[], int INFO[]);
}

namespace uno
{


enum eICNTL {
LP = 0, // Used by the subroutines as the output stream for error messages. If it is set to zero these messages will be suppressed. The default value is 6.
MP, // Used by the subroutines as the output stream for diagnostic printing and for warning messages. If it is set to zero then messages are suppressed. The default value is 6.
LDIAG, // Used by the subroutines to control diagnostic printing. If ICNTL(3) is equal to zero (the default), no diagnostic printing will be produced, a value of 1 will print scalar parameters (both in argument lists and in the control and information arrays) and a few entries of array parameters on entry and successful exit from each subroutine while ICNTL(3) equal to 2 will print all parameter values on entry and successful exit.
/* The entries ICNTL(4) to ICNTL(25) are not of interest to the general user and are discussed more fully by Duff and Reid (AERE R-10533, 1982) under the internal names IOVFLO, NEMIN and IFRLVL
*/
IOVFLO,
NEMIN,
IFRLVL1,
IFRLVL2,
IFRLVL3,
IFRLVL4,
IFRLVL5,
IFRLVL6,
IFRLVL7,
IFRLVL8,
IFRLVL9,
IFRLVL10,
IFRLVL11,
IFRLVL12,
IFRLVL13,
IFRLVL14,
IFRLVL15,
IFRLVL16,
IFRLVL17,
IFRLVL18,
IFRLVL19,
IFRLVL20,
UNUSED_ICNTL1,
UNUSED_ICNTL2,
UNUSED_ICNTL3,
UNUSED_ICNTL4,
UNUSED_ICNTL5,
};

enum eCNTL {
U = 0, // Used by the subroutine to control numerical pivoting. Values greater than 0.5 are treated as 0.5 and less than –0.5 as –0.5. Its default value is 0.1. If U is positive, numerical pivoting will be performed. If U is non-positive, no pivoting will be performed, the subroutine will fail if a zero pivot is encountered, and a flag (see section 2.3) will be set if not all pivots are of the same sign; the factorization will continue after a sign change is detected if U is zero but will exit immediately if U is less than zero. If the system is definite, then setting U to zero will decrease the factorization time while still providing a stable decomposition. For problems requiring greater than average numerical care a higher value than the default would be advisable.
FRATIO, // Given the default value of 1.0 by MA27I/ID. If MA27A/AD encounters a row of the reduced matrix with a proportion of entries greater than FRATIO, the row is treated as full. FRATIO is not altered by MA27.
PIVTOL, // Given the default value of 0.0 by MA27I/ID. MA27B/BD will not accept an entry with absolute value less than PIVTOL as a 1×1 pivot or the off-diagonal entry of a 2×2 pivot. PIVTOL is not altered by MA27.
UNUSED_CNTL1,
UNUSED_CNTL2,
};

enum eINFO {
IFLAG = 0, // An error flag. A value of zero indicates that the subroutine has performed successfully.
IERROR, // Provides supplementary information when there is an error.
NRLTOT, // Gives the total amount of REAL words required for a successful completion of MA27B/BD without the need for data compression provided no numerical pivoting is performed. The actual amount required may be higher because of numerical pivoting, but probably not by more than 3%.
NIRTOT, // Gives the total amount of INTEGER words required for a successful completion of MA27B/BD without the need for data compression provided no numerical pivoting is performed. The actual amount required may be higher because of numerical pivoting, but probably not by more than 3%.
NRLNEC, // Gives the amount of REAL words required for successful completion of MA27B/BD allowing data compression (see NCMPBR returned in INFO(12)), again provided no numerical pivoting is performed. Numerical pivoting may cause a higher value to be required, but probably not by more than 3%. If storage was conserved by equivalencing IW(1) with IRN(1), NRLNEC and NIRNEC cannot be calculated exactly but instead an upper bound will be returned. Experience has shown that this can overestimate the exact values by 50% although the tightness of the bound is very problem dependent. For example, a tight bound will generally be obtained if there are many more entries in the factors than in the input matrix.
NIRNEC, // Gives the amount of INTEGER words required for successful completion of MA27B/BD allowing data compression (see NCMPBR returned in INFO(12)), again provided no numerical pivoting is performed. Numerical pivoting may cause a higher value to be required, but probably not by more than 3%. If storage was conserved by equivalencing IW(1) with IRN(1), NRLNEC and NIRNEC cannot be calculated exactly but instead an upper bound will be returned. Experience has shown that this can overestimate the exact values by 50% although the tightness of the bound is very problem dependent. For example, a tight bound will generally be obtained if there are many more entries in the factors than in the input matrix.
NRLADU, // Gives the number of REAL words required to hold the matrix factors if no numerical pivoting is performed by MA27B/BD. Numerical pivoting may change this slightly.
NIRADU, // Gives the number of INTEGER words required to hold the matrix factors if no numerical pivoting is performed by MA27B/BD. Numerical pivoting may change this slightly.
NRLBDU, // Gives the amount of REAL words actually used to hold the factorization.
NIRBDU, // Gives the amount of INTEGER words actually used to hold the factorization.
NCMPA, // Holds the number of compresses of the internal data structure performed by MA27A/AD. If this is high (say > 10), the performance of MA27A/AD may be improved by increasing the length of array IW.
NCMPBR, // Holds the number of compresses of the real data structure required by the factorization. If either of these is high (say > 10), then the speed of the factorization may be increased by allocating more space to the arrays A as appropriate.
NCMPBI, // Holds the number of compresses of the integer data structure required by the factorization. If either of these is high (say > 10), then the speed of the factorization may be increased by allocating more space to the arrays IW as appropriate.
NTWO, // Gives the number of 2×2 pivots used during the factorization.
NEIG, // Gives the number of negative eigenvalues of A.
UNUSED_INFO1,
UNUSED_INFO2,
UNUSED_INFO3,
UNUSED_INFO4,
UNUSED_INFO5,
};

enum eIFLAG {
NSTEPS = -7, // Value of NSTEPS outside the range 1 ≤ NSTEPS ≤ N (MA27B/BD entry).
PIVOTSIGN = -6, // A change of sign of pivots has been detected when U was negative. INFO(2) is set to the pivot step at which the change was detected. (MA27B/BD entry only)
SINGULAR = -5, // Matrix is singular (MA27B/BD entry only). INFO(2) is set to the pivot step at which singularity was detected
INSUFFICIENTREAL = -4, // Failure due to insufficient space allocated to array A (MA27B/BD entry only). INFO(2) is set to a value that may suffice.
INSUFFICIENTINTEGER = -3, // Failure due to insufficient space allocated to array IW (MA27A/AD and MA27B/BD entries). INFO(2) is set to a value that may suffice.
NZOUTOFRANGE = -2, // Value of NZ out of range. NZ < 0. (MA27A/AD and MA27B/BD entries)
NOUTOFRANGE = -1, // Value of N out of range. N < 1. (MA27A/AD and MA27B/BD entries).
SUCCESS = 0, // Successful completion.
IDXOUTOFRANGE = 1, // ndex (in IRN or ICN) out of range. Action taken by subroutine is to ignore any such entries and continue (MA27A/AD and MA27B/BD entries). INFO(2) is set to the number of faulty entries. Details of the first ten are printed on unit ICNTL(2).
FALSEDEFINITENESS, // Pivots have different signs when factorizing a supposedly definite matrix (when the value of U in CNTL(1) is zero) (MA27B/BD entry only). INFO(2) is set to the number of sign changes. Note that this warning will overwrite an INFO(1)=1 warning. Details of the first ten are printed on unit ICNTL(2).
RANKDEFECT, // Matrix is rank deficient. In this case, a decomposition will still have been produced which will enable the subsequent solution of consistent equations (MA27B/BD entry only). INFO(2) will be set to the rank of the matrix. Note that this warning will overwrite an INFO(1)=1 or INFO(1)=2 warning.
};


MA27Solver::MA27Solver(size_t max_dimension, size_t max_number_nonzeros)
: DirectSymmetricIndefiniteLinearSolver<size_t, double>(max_dimension)
, nz_max(static_cast<int>(max_number_nonzeros))
, n(static_cast<int>(max_dimension))
, nnz(static_cast<int>(max_number_nonzeros))
, irn(max_number_nonzeros)
, icn(max_number_nonzeros)
, iw((2 * max_number_nonzeros + 3 * max_dimension + 1) * 6 / 5)
, ikeep(3 * max_number_nonzeros)
, iw1(2 * max_dimension)
{

iflag = 0;
// set the default values of the controlling parameters
MA27ID(icntl.data(), cntl.data());
// suppress warning messages
icntl[eICNTL::LP] = 0;
icntl[eICNTL::MP] = 0;
icntl[eICNTL::LDIAG] = 0;
}

void MA27Solver::factorize(const SymmetricMatrix<size_t, double> &matrix)
{
// // general factorization method: symbolic factorization and numerical factorization
do_symbolic_factorization(matrix);
do_numerical_factorization(matrix);
}

void MA27Solver::do_symbolic_factorization(const SymmetricMatrix<size_t, double> &matrix)
{
assert(matrix.dimension() <= iw1.capacity() && "MA27Solver: the dimension of the matrix is larger than the preallocated size");
assert(matrix.number_nonzeros() <= irn.capacity() &&
"MA27Solver: the number of nonzeros of the matrix is larger than the preallocated size");

// build the internal matrix representation
save_matrix_to_local_format(matrix);

n = static_cast<int>(matrix.dimension());
nnz = static_cast<int>(matrix.number_nonzeros());

// symbolic factorization
int liw = static_cast<int>(iw.size());
MA27AD( &n, &nnz, /* size info */
irn.data(), icn.data(), /* matrix indices */
iw.data(), &liw, ikeep.data(), iw1.data(), /* solver workspace */
&nsteps, &iflag,
icntl.data(), cntl.data(),
info.data(), &ops);

factor.resize(static_cast<std::size_t>(3 * info[eINFO::NRLNEC] / 2));

std::copy(matrix.data_pointer(), matrix.data_pointer() + matrix.number_nonzeros(), factor.begin());

assert(eIFLAG::SUCCESS == info[eINFO::IFLAG] && "MA27: the symbolic factorization failed");
if (eIFLAG::SUCCESS != info[eINFO::IFLAG] )
{
WARNING << "MA27 has issued a warning: IFLAG = " << info[eINFO::IFLAG] << " additional info, IERROR = " << info[eINFO::IERROR] << '\n';
}
}

void MA27Solver::repeat_factorization_after_resizing([[maybe_unused]]const SymmetricMatrix<size_t, double> &matrix) {
if (eIFLAG::INSUFFICIENTINTEGER == info[eINFO::IFLAG])
{
INFO << "MA27: insufficient integer workspace, resizing and retrying. \n";
// increase the size of iw
iw.resize(static_cast<std::size_t>(info[eINFO::IERROR]));
}

if (eIFLAG::INSUFFICIENTREAL == info[eINFO::IFLAG])
{
INFO << "MA27: insufficient real workspace, resizing and retrying. \n";
// increase the size of factor
factor.resize(static_cast<std::size_t>(info[eINFO::IERROR]));
}

int la = static_cast<int>(factor.size());
int liw = static_cast<int>(iw.size());

MA27BD(&n, &nnz, irn.data(), icn.data(), factor.data(), &la, iw.data(), &liw,
ikeep.data(), &nsteps, &maxfrt, iw1.data(), icntl.data(), cntl.data(), info.data());

if (eIFLAG::INSUFFICIENTINTEGER == info[eINFO::IFLAG] || eIFLAG::INSUFFICIENTREAL == info[eINFO::IFLAG])
{
repeat_factorization_after_resizing(matrix);
}
}

void MA27Solver::do_numerical_factorization([[maybe_unused]]const SymmetricMatrix<size_t, double> &matrix)
{
assert(matrix.dimension() <= iw1.capacity() && "MA27Solver: the dimension of the matrix is larger than the preallocated size");
assert(nnz == static_cast<int>(matrix.number_nonzeros()) && "MA27Solver: the numbers of nonzeros do not match");

// numerical factorization
int la = static_cast<int>(factor.size());
int liw = static_cast<int>(iw.size());
MA27BD(&n, &nnz, irn.data(), icn.data(), factor.data(), &la, iw.data(), &liw,
ikeep.data(), &nsteps, &maxfrt, iw1.data(), icntl.data(), cntl.data(), info.data());

if (eIFLAG::INSUFFICIENTINTEGER == info[eINFO::IFLAG] || eIFLAG::INSUFFICIENTREAL == info[eINFO::IFLAG])
{
repeat_factorization_after_resizing(matrix);
}

switch (info[eINFO::IFLAG])
{
case NSTEPS:
WARNING << "MA27BD: Value of NSTEPS outside the range 1 ≤ NSTEPS ≤ N" << '\n';
break;
case PIVOTSIGN:
WARNING << "MA27BD: A change of sign of pivots has been detected when U was negative. Detected at pivot step " << info[eINFO::IERROR] << '\n';
break;
case SINGULAR:
WARNING << "MA27BD: Matrix is singular. Singularity detected during pivot step "<< info[eINFO::IERROR] << '\n';
break;
case NZOUTOFRANGE:
WARNING << "MA27BD: Value of NZ out of range. NZ < 0." << '\n';
break;
case NOUTOFRANGE:
WARNING << "MA27BD: Value of N out of range. N < 1." << '\n';
break;
case IDXOUTOFRANGE:
WARNING << "MA27BD: Index (in IRN or ICN) out of range. " << info[eINFO::IERROR] << " indices affected." << '\n';
break;
case FALSEDEFINITENESS:
WARNING << "MA27BD: Matrix was supposed to be definite, but pivots have different signs when factorizing. Detected " << info[eINFO::IERROR] << " sign changes." << '\n';
break;
case RANKDEFECT:
WARNING << "MA27BD: Matrix is rank deficient. Rank: " << info[eINFO::IERROR] << " whereas dimension " << n << '\n';
break;
}

}

void MA27Solver::solve_indefinite_system([[maybe_unused]]const SymmetricMatrix<size_t, double> &matrix, const Vector<double> &rhs, Vector<double> &result)
{
// solve
std::vector<double> w(maxfrt); // double workspace
int la = static_cast<int>(factor.size());
int liw = static_cast<int>(iw.size());

result = rhs;

MA27CD( &n,
factor.data(),
&la,
iw.data(),
&liw,
w.data(),
&maxfrt,
result.data(),
iw1.data(),
&nsteps,
icntl.data(),
info.data());

assert(info[eINFO::IFLAG] == eIFLAG::SUCCESS && "MA27: the solution failed");
if (eIFLAG::SUCCESS != info[eINFO::IFLAG] )
{
WARNING << "MA27 has issued a warning: IFLAG = " << info[eINFO::IFLAG] << " additional info, IERROR = " << info[eINFO::IERROR] << '\n';
}
}

std::tuple<size_t, size_t, size_t> MA27Solver::get_inertia() const
{
// rank = number_positive_eigenvalues + number_negative_eigenvalues
// n = rank + number_zero_eigenvalues
const size_t rankA = rank();
const size_t num_negative_eigenvalues = number_negative_eigenvalues();
const size_t num_positive_eigenvalues = rankA - num_negative_eigenvalues;
const size_t num_zero_eigenvalues = static_cast<size_t>(n) - rankA;
return std::make_tuple(num_positive_eigenvalues, num_negative_eigenvalues, num_zero_eigenvalues);
}

size_t MA27Solver::number_negative_eigenvalues() const
{
return static_cast<size_t>(info[eINFO::NEIG]);
}

bool MA27Solver::matrix_is_singular() const
{
return (info[eINFO::IFLAG] == eIFLAG::SINGULAR || info[eINFO::IFLAG] == eIFLAG::RANKDEFECT);
}

size_t MA27Solver::rank() const
{
return info[eINFO::IFLAG] == eIFLAG::RANKDEFECT ? static_cast<size_t>(info[eINFO::IERROR]) : static_cast<size_t>(n);
}

void MA27Solver::save_matrix_to_local_format(const SymmetricMatrix<size_t, double> &matrix)
{
// build the internal matrix representation
irn.clear();
icn.clear();
factor.clear();
constexpr auto fortran_shift = 1;
for (const auto [row_index, column_index, element] : matrix)
{
irn.emplace_back(static_cast<int>(row_index + fortran_shift));
icn.emplace_back(static_cast<int>(column_index + fortran_shift));
factor.emplace_back(element);
}
}

} // namespace uno
Loading

0 comments on commit 9fb6506

Please sign in to comment.