doc/html/Amesos2__CssMKL__def_8hpp_source.html

 // @HEADER

 // *****************************************************************************

 //           Amesos2: Templated Direct Sparse Solver Package

 //

 // Copyright 2011 NTESS and the Amesos2 contributors.

 // SPDX-License-Identifier: BSD-3-Clause

 // *****************************************************************************

 // @HEADER


 #ifndef AMESOS2_CSSMKL_DEF_HPP

 #define AMESOS2_CSSMKL_DEF_HPP


 #include <map>


 #include <Teuchos_Tuple.hpp>

 #include <Teuchos_toString.hpp>

 #include <Teuchos_StandardParameterEntryValidators.hpp>


 #include "Amesos2_SolverCore_def.hpp"

 #include "Amesos2_CssMKL_decl.hpp"


 namespace Amesos2 {


   namespace PMKL {

 #   include <mkl.h>

 #   include <mkl_pardiso.h>

   }


   template <class Matrix, class Vector>

   CssMKL<Matrix,Vector>::CssMKL(Teuchos::RCP<const Matrix> A,

                                         Teuchos::RCP<Vector>       X,

                                         Teuchos::RCP<const Vector> B)

     : SolverCore<Amesos2::CssMKL,Matrix,Vector>(A, X, B) // instantiate superclass

     , n_(Teuchos::as<int_t>(this->globalNumRows_))

     , perm_(this->globalNumRows_)

     , nrhs_(0)

     , css_initialized_(false)

     , is_contiguous_(true)

     , msglvl_(0)

   {

     // Matrix info

     Teuchos::RCP<const Teuchos::Comm<int> > matComm = this->matrixA_->getComm ();

     const global_ordinal_type indexBase = this->matrixA_->getRowMap ()->getIndexBase ();

     const local_ordinal_type  nrows = this->matrixA_->getLocalNumRows();


     // rowmap for loadA (to have locally contiguous)

     css_rowmap_ =

       Teuchos::rcp (new map_type (this->globalNumRows_, nrows, indexBase, matComm));

     css_contig_rowmap_ = Teuchos::rcp (new map_type (0, 0, indexBase, matComm));

     css_contig_colmap_ = Teuchos::rcp (new map_type (0, 0, indexBase, matComm));


     // set the default matrix type

     set_css_mkl_matrix_type();

     set_css_mkl_default_parameters(pt_, iparm_);


     // index base

     iparm_[34] = (indexBase == 0 ? 1 : 0);  /* Use one or zero-based indexing */

     // 1D block-row distribution (using Contiguous map)

     auto frow  = css_rowmap_->getMinGlobalIndex();

     iparm_[39] = 2;  /* Matrix input format. */

     iparm_[40] = frow;          /* > Beginning of input domain. */

     iparm_[41] = frow+nrows-1;  /* > End of input domain. */


     // get MPI Comm

     TEUCHOS_TEST_FOR_EXCEPTION(

         matComm.is_null (), std::logic_error, "Amesos2::CssMKL "

         "constructor: The matrix's communicator is null!");

     Teuchos::RCP<const Teuchos::MpiComm<int> > matMpiComm =

       Teuchos::rcp_dynamic_cast<const Teuchos::MpiComm<int> > (matComm);

     TEUCHOS_TEST_FOR_EXCEPTION(

       matMpiComm.is_null (), std::logic_error, "Amesos2::CssMKL "

       "constructor: The matrix's communicator is not an MpiComm!");

     TEUCHOS_TEST_FOR_EXCEPTION(

       matMpiComm->getRawMpiComm ().is_null (), std::logic_error, "Amesos2::"

       "CssMKL constructor: The matrix's communicator claims to be a "

       "Teuchos::MpiComm<int>, but its getRawPtrComm() method returns "

       "Teuchos::null!  This means that the underlying MPI_Comm doesn't even "

       "exist, which likely implies that the Teuchos::MpiComm was constructed "

       "incorrectly.  It means something different than if the MPI_Comm were "

       "MPI_COMM_NULL.");

     MPI_Comm CssComm = *(matMpiComm->getRawMpiComm ());

     CssComm_ = MPI_Comm_c2f(CssComm);

   }


   template <class Matrix, class Vector>

   CssMKL<Matrix,Vector>::~CssMKL( )

   {

     /*

      * Free any memory allocated by the CssMKL library functions

      */

     int_t error = 0;

     if (css_initialized_)

     {

       int_t phase = -1;         // release all internal solver memory

       void *bdummy, *xdummy;

       const MPI_Fint CssComm = CssComm_;

       function_map::cluster_sparse_solver( pt_, const_cast<int_t*>(&maxfct_),

                              const_cast<int_t*>(&mnum_), &mtype_, &phase, &n_,

                              nzvals_view_.data(), rowptr_view_.data(),

                              colind_view_.data(), perm_.getRawPtr(), &nrhs_, iparm_,

                              const_cast<int_t*>(&msglvl_), &bdummy, &xdummy, &CssComm, &error );

       css_initialized_ = false;

     }

     check_css_mkl_error(Amesos2::CLEAN, error);

   }


   template<class Matrix, class Vector>

   int

   CssMKL<Matrix,Vector>::preOrdering_impl()

   {

     // preOrdering done during "Analysis" (aka symbolic

     // factorization) phase

     return(0);

   }


   template <class Matrix, class Vector>

   int

   CssMKL<Matrix,Vector>::symbolicFactorization_impl()

   {

     if (msglvl_ > 0 && this->matrixA_->getComm()->getRank() == 0) {

       std::cout << " CssMKL::symbolicFactorization:\n" << std::endl;

       for (int i=0; i < 64; i++) std::cout << " * IPARM[" << i << "] = " << iparm_[i] << std::endl;

     }

     int_t error = 0;

     {

 #ifdef HAVE_AMESOS2_TIMERS

       Teuchos::TimeMonitor symbFactTimer( this->timers_.symFactTime_ );

 #endif


       int_t phase = 11; // Analysis

       void *bdummy, *xdummy;

       const MPI_Fint CssComm = CssComm_;

       function_map::cluster_sparse_solver( pt_, const_cast<int_t*>(&maxfct_),

                              const_cast<int_t*>(&mnum_), &mtype_, &phase, &n_,

                              nzvals_view_.data(), rowptr_view_.data(),

                              colind_view_.data(), perm_.getRawPtr(), &nrhs_, iparm_,

                              const_cast<int_t*>(&msglvl_), &bdummy, &xdummy, &CssComm, &error );

     }

     check_css_mkl_error(Amesos2::SYMBFACT, error);

     if (msglvl_ > 0 && this->matrixA_->getComm()->getRank() == 0) {

       std::cout << " CssMKL::symbolicFactorization done:" << std::endl;

       std::cout << " * Time : " << this->timers_.symFactTime_.totalElapsedTime() << std::endl;

     }


     // Pardiso only lets you retrieve the total number of factor

     // non-zeros, not for each individually.  We should document how

     // such a situation is reported.

     this->setNnzLU(iparm_[17]);

     css_initialized_ = true;

     return(0);

   }


   template <class Matrix, class Vector>

   int

   CssMKL<Matrix,Vector>::numericFactorization_impl()

   {

     if (msglvl_ > 0 && this->matrixA_->getComm()->getRank() == 0) {

       std::cout << " CssMKL::numericFactorization:\n" << std::endl;

     }

     int_t error = 0;

     {

 #ifdef HAVE_AMESOS2_TIMERS

       Teuchos::TimeMonitor numFactTimer( this->timers_.numFactTime_ );

 #endif


       //int_t phase = 12; // Analysis, numerical factorization

       int_t phase = 22; // Numerical factorization

       void *bdummy, *xdummy;

       const MPI_Fint CssComm = CssComm_;

       function_map::cluster_sparse_solver( pt_, const_cast<int_t*>(&maxfct_),

                              const_cast<int_t*>(&mnum_), &mtype_, &phase, &n_,

                              nzvals_view_.data(), rowptr_view_.data(),

                              colind_view_.data(), perm_.getRawPtr(), &nrhs_, iparm_,

                              const_cast<int_t*>(&msglvl_), &bdummy, &xdummy, &CssComm, &error );

     }

     check_css_mkl_error(Amesos2::NUMFACT, error);

     if (msglvl_ > 0 && this->matrixA_->getComm()->getRank() == 0) {

       std::cout << " CssMKL::numericFactorization done:" << std::endl;

       std::cout << " Time : " << this->timers_.numFactTime_.totalElapsedTime() << std::endl;

     }


     return( 0 );

   }


   template <class Matrix, class Vector>

   int

   CssMKL<Matrix,Vector>::solve_impl(const Teuchos::Ptr<MultiVecAdapter<Vector> >       X,

                                     const Teuchos::Ptr<const MultiVecAdapter<Vector> > B) const

   {

     using Teuchos::as;


     // Get B data

     const local_ordinal_type ld_rhs = this->matrixA_->getLocalNumRows();

     nrhs_ = as<int_t>(X->getGlobalNumVectors());


     const size_t val_store_size = as<size_t>(ld_rhs * nrhs_);

     xvals_.resize(val_store_size);

     bvals_.resize(val_store_size);

     {

 #ifdef HAVE_AMESOS2_TIMERS

       Teuchos::TimeMonitor mvConvTimer( this->timers_.vecConvTime_ );

       Teuchos::TimeMonitor redistTimer( this->timers_.vecRedistTime_ );

 #endif


       Util::get_1d_copy_helper<

         MultiVecAdapter<Vector>,

         solver_scalar_type>::do_get(B, bvals_(),

           as<size_t>(ld_rhs),

           Teuchos::ptrInArg(*css_rowmap_));

     }


     int_t error = 0;

     {

 #ifdef HAVE_AMESOS2_TIMERS

       Teuchos::TimeMonitor solveTimer( this->timers_.solveTime_ );

 #endif


       const int_t phase = 33; // Solve, iterative refinement

       const MPI_Fint CssComm = CssComm_;

       function_map::cluster_sparse_solver( pt_,

                              const_cast<int_t*>(&maxfct_),

                              const_cast<int_t*>(&mnum_),

                              const_cast<int_t*>(&mtype_),

                              const_cast<int_t*>(&phase),

                              const_cast<int_t*>(&n_),

                              const_cast<solver_scalar_type*>(nzvals_view_.data()),

                              const_cast<int_t*>(rowptr_view_.data()),

                              const_cast<int_t*>(colind_view_.data()),

                              const_cast<int_t*>(perm_.getRawPtr()),

                              &nrhs_,

                              const_cast<int_t*>(iparm_),

                              const_cast<int_t*>(&msglvl_),

                              as<void*>(bvals_.getRawPtr()),

                              as<void*>(xvals_.getRawPtr()), &CssComm, &error );

     }

     check_css_mkl_error(Amesos2::SOLVE, error);


     /* Get values to X */

     {

 #ifdef HAVE_AMESOS2_TIMERS

       Teuchos::TimeMonitor redistTimer(this->timers_.vecRedistTime_);

 #endif


       Util::put_1d_data_helper<

       MultiVecAdapter<Vector>,

         solver_scalar_type>::do_put(X, xvals_(),

           as<size_t>(ld_rhs),

           Teuchos::ptrInArg(*css_rowmap_));

     }


     return( 0 );

   }


   template <class Matrix, class Vector>

   bool

   CssMKL<Matrix,Vector>::matrixShapeOK_impl() const

   {

     // CssMKL supports square matrices

     return( this->globalNumRows_ == this->globalNumCols_ );

   }


   template <class Matrix, class Vector>

   void

   CssMKL<Matrix,Vector>::setParameters_impl(const Teuchos::RCP<Teuchos::ParameterList> & parameterList )

   {

     using Teuchos::RCP;

     using Teuchos::getIntegralValue;

     using Teuchos::ParameterEntryValidator;


     RCP<const Teuchos::ParameterList> valid_params = getValidParameters_impl();


     // 2: Fill-in reordering from METIS, 3: thread dissection, 10: MPI version of the nested dissection

     if( parameterList->isParameter("IPARM(2)") )

     {

       RCP<const ParameterEntryValidator> fillin_validator = valid_params->getEntry("IPARM(2)").validator();

       parameterList->getEntry("IPARM(2)").setValidator(fillin_validator);

       iparm_[1] = getIntegralValue<int>(*parameterList, "IPARM(2)");

     }


     // Max numbers of iterative refinement steps

     if( parameterList->isParameter("IPARM(8)") )

     {

       RCP<const ParameterEntryValidator> refine_validator = valid_params->getEntry("IPARM(8)").validator();

       parameterList->getEntry("IPARM(8)").setValidator(refine_validator);

       iparm_[7] = getIntegralValue<int>(*parameterList, "IPARM(8)");

     }


     // Perturb the pivot elements

     if( parameterList->isParameter("IPARM(10)") )

     {

       RCP<const ParameterEntryValidator> pivot_perturb_validator = valid_params->getEntry("IPARM(10)").validator();

       parameterList->getEntry("IPARM(10)").setValidator(pivot_perturb_validator);

       iparm_[9] = getIntegralValue<int>(*parameterList, "IPARM(10)");

     }


     // First check if the control object requests a transpose solve.

     // Then solver specific options can override this.

     iparm_[11] = this->control_.useTranspose_ ? 2 : 0;

     // Normal solve (0), or a transpose solve (1)

     if( parameterList->isParameter("IPARM(12)") )

     {

       RCP<const ParameterEntryValidator> trans_validator = valid_params->getEntry("IPARM(12)").validator();

       parameterList->getEntry("IPARM(12)").setValidator(trans_validator);

       iparm_[11] = getIntegralValue<int>(*parameterList, "IPARM(12)");

     }


     // (Non-)symmetric matchings : detault 1 for nonsymmetric and 0 for symmetric matrix (default is nonsymmetric)

     if( parameterList->isParameter("IPARM(13)") )

     {

       RCP<const ParameterEntryValidator> trans_validator = valid_params->getEntry("IPARM(13)").validator();

       parameterList->getEntry("IPARM(13)").setValidator(trans_validator);

       iparm_[12] = getIntegralValue<int>(*parameterList, "IPARM(13)");

     }


     // Output: Number of nonzeros in the factor LU

     if( parameterList->isParameter("IPARM(18)") )

     {

       RCP<const ParameterEntryValidator> report_validator = valid_params->getEntry("IPARM(18)").validator();

       parameterList->getEntry("IPARM(18)").setValidator(report_validator);

       iparm_[17] = getIntegralValue<int>(*parameterList, "IPARM(18)");

     }


     // Check input matrix is sorted

     if( parameterList->isParameter("IPARM(28)") )

     {

       RCP<const ParameterEntryValidator> report_validator = valid_params->getEntry("IPARM(28)").validator();

       parameterList->getEntry("IPARM(28)").setValidator(report_validator);

       iparm_[27] = getIntegralValue<int>(*parameterList, "IPARM(28)");

     }


     if( parameterList->isParameter("IsContiguous") ){

       is_contiguous_ = parameterList->get<bool>("IsContiguous");

     }


     if( parameterList->isParameter("verbose") ){

       msglvl_ = parameterList->get<int>("verbose");

     }

   }


 /*

  * TODO: It would be nice if the parameters could be expressed as

  * either all string or as all integers.  I see no way of doing this

  * at present with the standard validators.  However, we could create

  * our own validators or kindly ask the Teuchos team to add some

  * features for use.

  *

  * The issue is that with the current validators we cannot specify

  * arbitrary sets of numbers that are the only allowed parameters.

  * For example the IPARM(2) parameter can take only the values 0, 2,

  * and 3.  The EnhancedNumberValidator can take a min value, and max

  * value, and a step size, but with those options there is no way to

  * specify the needed set.

  *

  * Another missing feature is the ability to give docstrings for such

  * numbers.  For example IPARM(25) can take on the values 0 and 1.

  * This would be easy enough to accomplish with just a number

  * validator, but then have no way to document the effect of each

  * value.

  */

 template <class Matrix, class Vector>

 Teuchos::RCP<const Teuchos::ParameterList>

 CssMKL<Matrix,Vector>::getValidParameters_impl() const

 {

   using std::string;

   using Teuchos::as;

   using Teuchos::RCP;

   using Teuchos::tuple;

   using Teuchos::toString;

   using Teuchos::EnhancedNumberValidator;

   using Teuchos::setStringToIntegralParameter;

   using Teuchos::anyNumberParameterEntryValidator;


   static Teuchos::RCP<const Teuchos::ParameterList> valid_params;


   if( is_null(valid_params) ){

     Teuchos::RCP<Teuchos::ParameterList> pl = Teuchos::parameterList();


     void* pt_temp[64];

     int_t iparm_temp[64];

     set_css_mkl_default_parameters(pt_temp, iparm_temp);

     setStringToIntegralParameter<int>("IPARM(2)", toString(iparm_temp[1]),

                                       "Fill-in reducing ordering for the input matrix",

                                       tuple<string>("2", "3", "10"),

                                       tuple<string>("Nested dissection algorithm from METIS",

                                       "Parallel version of the nested dissection algorithm",

                                       "MPI version of the nested dissection and symbolic factorization algorithms"),

                                       tuple<int>(2, 3, 10),

                                       pl.getRawPtr());


     setStringToIntegralParameter<int>("IPARM(12)", toString(iparm_temp[11]),

                                       "Solve with transposed or conjugate transposed matrix A",

                                       tuple<string>("0", "1", "2"),

                                       tuple<string>("Non-transposed",

                                       "Conjugate-transposed",

                                       "Transposed"),

                                       tuple<int>(0, 1, 2),

                                       pl.getRawPtr());


     setStringToIntegralParameter<int>("IPARM(13)", toString(iparm_temp[12]),

                                       "Use weighted matching",

                                       tuple<string>("0", "1"),

                                       tuple<string>("No matching", "Use matching"),

                                       tuple<int>(0, 1),

                                       pl.getRawPtr());


     Teuchos::AnyNumberParameterEntryValidator::EPreferredType preferred_int =

       Teuchos::AnyNumberParameterEntryValidator::PREFER_INT;


     Teuchos::AnyNumberParameterEntryValidator::AcceptedTypes accept_int( false );

     accept_int.allowInt( true );


     pl->set("IPARM(8)" , as<int>(iparm_temp[7]) , "Iterative refinement step",

             anyNumberParameterEntryValidator(preferred_int, accept_int));


     pl->set("IPARM(10)", as<int>(iparm_temp[9]) , "Pivoting perturbation",

             anyNumberParameterEntryValidator(preferred_int, accept_int));


     pl->set("IPARM(18)", as<int>(iparm_temp[17]), "Report the number of non-zero elements in the factors",

             anyNumberParameterEntryValidator(preferred_int, accept_int));


     pl->set("IPARM(28)", as<int>(iparm_temp[27]), "Check input matrix is sorted",

             anyNumberParameterEntryValidator(preferred_int, accept_int));


     pl->set("IsContiguous", true, "Whether GIDs contiguous");


     pl->set("verbose", 0, "Verbosity Message Level");


     valid_params = pl;

   }


   return valid_params;

 }


 template <class Matrix, class Vector>

 bool

 CssMKL<Matrix,Vector>::loadA_impl(EPhase current_phase)

 {

 #ifdef HAVE_AMESOS2_TIMERS

   Teuchos::TimeMonitor convTimer(this->timers_.mtxConvTime_);

 #endif


   // CssMKL does not need matrix data in the pre-ordering phase

   if( current_phase == PREORDERING ) return( false );


   // is_contiguous         : input is contiguous

   // CONTIGUOUS_AND_ROOTED : input is not contiguous, so make output contiguous

   EDistribution dist_option = (iparm_[39] != 0 ? DISTRIBUTED_NO_OVERLAP : ((is_contiguous_ == true) ? ROOTED : CONTIGUOUS_AND_ROOTED));

   if (dist_option == DISTRIBUTED_NO_OVERLAP && !is_contiguous_) {

     // Neeed to form contiguous matrix

     #if 1

     // Only reinex GIDs

     css_rowmap_ = this->matrixA_->getRowMap(); // use original map to redistribute vectors in solve

     Teuchos::RCP<const MatrixAdapter<Matrix> > contig_mat = this->matrixA_->reindex(css_contig_rowmap_, css_contig_colmap_, current_phase);

     #else

     // Redistribued matrixA into contiguous GIDs

     Teuchos::RCP<const MatrixAdapter<Matrix> > contig_mat = this->matrixA_->get(ptrInArg(*css_rowmap_));

     //css_rowmap_ = contig_mat->getRowMap(); // use new map to redistribute vectors in solve

     #endif

     // Copy into local views

     if (current_phase == SYMBFACT) {

         Kokkos::resize(nzvals_temp_, contig_mat->getLocalNNZ());

         Kokkos::resize(nzvals_view_, contig_mat->getLocalNNZ());

         Kokkos::resize(colind_view_, contig_mat->getLocalNNZ());

         Kokkos::resize(rowptr_view_, contig_mat->getLocalNumRows() + 1);

     }

     int_t nnz_ret = 0;

     {

 #ifdef HAVE_AMESOS2_TIMERS

       Teuchos::TimeMonitor mtxRedistTimer( this->timers_.mtxRedistTime_ );

 #endif

       Util::get_crs_helper_kokkos_view<MatrixAdapter<Matrix>,

         host_value_type_array,host_ordinal_type_array, host_size_type_array >::do_get(

                                          contig_mat.ptr(),

                                          nzvals_temp_, colind_view_, rowptr_view_,

                                          nnz_ret,

                                          ptrInArg(*(contig_mat->getRowMap())),

                                          #if 1

                                          DISTRIBUTED_NO_OVERLAP,

                                          #else

                                          ROOTED,

                                          #endif

                                          SORTED_INDICES);

       Kokkos::deep_copy(nzvals_view_, nzvals_temp_);

     }

   } else {

     if (current_phase == SYMBFACT) {

       if (dist_option == DISTRIBUTED_NO_OVERLAP) {

         Kokkos::resize(nzvals_temp_, this->matrixA_->getLocalNNZ());

         Kokkos::resize(nzvals_view_, this->matrixA_->getLocalNNZ());

         Kokkos::resize(colind_view_, this->matrixA_->getLocalNNZ());

         Kokkos::resize(rowptr_view_, this->matrixA_->getLocalNumRows() + 1);

       } else {

         if( this->root_ ) {

           Kokkos::resize(nzvals_temp_, this->matrixA_->getGlobalNNZ());

           Kokkos::resize(nzvals_view_, this->matrixA_->getGlobalNNZ());

           Kokkos::resize(colind_view_, this->matrixA_->getGlobalNNZ());

           Kokkos::resize(rowptr_view_, this->matrixA_->getGlobalNumRows() + 1);

         } else {

           Kokkos::resize(nzvals_temp_, 0);

           Kokkos::resize(nzvals_view_, 0);

           Kokkos::resize(colind_view_, 0);

           Kokkos::resize(rowptr_view_, 0);

         }

       }

     }

     int_t nnz_ret = 0;

     {

 #ifdef HAVE_AMESOS2_TIMERS

       Teuchos::TimeMonitor mtxRedistTimer( this->timers_.mtxRedistTime_ );

 #endif

       Util::get_crs_helper_kokkos_view<MatrixAdapter<Matrix>,

         host_value_type_array,host_ordinal_type_array, host_size_type_array >::do_get(

                                          this->matrixA_.ptr(),

                                          nzvals_temp_, colind_view_, rowptr_view_,

                                          nnz_ret,

                                          ptrInArg(*(this->matrixA_->getRowMap())),

                                          dist_option,

                                          SORTED_INDICES);

       Kokkos::deep_copy(nzvals_view_, nzvals_temp_);

     }

   }

   return( true );

 }


 template <class Matrix, class Vector>

 void

 CssMKL<Matrix,Vector>::check_css_mkl_error(EPhase phase,

                                                    int_t error) const

 {

   int error_i = error;

   Teuchos::broadcast(*(this->getComm()), 0, &error_i); // We only care about root's value


   if( error == 0 ) return;      // No error


   std::string errmsg = "Other error";

   switch( error ){

   case -1:

     errmsg = "CssMKL reported error: 'Input inconsistent'";

     break;

   case -2:

     errmsg = "CssMKL reported error: 'Not enough memory'";

     break;

   case -3:

     errmsg = "CssMKL reported error: 'Reordering problem'";

     break;

   case -4:

     errmsg =

       "CssMKL reported error: 'Zero pivot, numerical "

       "factorization or iterative refinement problem'";

     break;

   case -5:

     errmsg = "CssMKL reported error: 'Unclassified (internal) error'";

     break;

   case -6:

     errmsg = "CssMKL reported error: 'Reordering failed'";

     break;

   case -7:

     errmsg = "CssMKL reported error: 'Diagonal matrix is singular'";

     break;

   case -8:

     errmsg = "CssMKL reported error: '32-bit integer overflow problem'";

     break;

   case -9:

     errmsg = "CssMKL reported error: 'Not enough memory for OOC'";

     break;

   case -10:

     errmsg = "CssMKL reported error: 'Problems with opening OOC temporary files'";

     break;

   case -11:

     errmsg = "CssMKL reported error: 'Read/write problem with OOC data file'";

     break;

   }

   errmsg += (" at phase = "+std::to_string(phase));


   TEUCHOS_TEST_FOR_EXCEPTION( true, std::runtime_error, errmsg );

 }


 template <class Matrix, class Vector>

 void

 CssMKL<Matrix,Vector>::set_css_mkl_matrix_type(int_t mtype)

 {

   if( mtype == 0 ){

     if( complex_ ){

       mtype_ = 13;              // complex, unsymmetric

     } else {

       mtype_ = 11;              // real, unsymmetric

     }

   } else {

     switch( mtype ){

     case 11:

       TEUCHOS_TEST_FOR_EXCEPTION( complex_,

                           std::invalid_argument,

                           "Cannot set a real Pardiso matrix type with scalar type complex" );

       mtype_ = 11; break;

     case 13:

       TEUCHOS_TEST_FOR_EXCEPTION( !complex_,

                           std::invalid_argument,

                           "Cannot set a complex Pardiso matrix type with non-complex scalars" );

       mtype_ = 13; break;

     default:

       TEUCHOS_TEST_FOR_EXCEPTION( true,

                           std::invalid_argument,

                           "Symmetric matrices are not yet supported by the Amesos2 interface" );

     }

   }

 }


 template <class Matrix, class Vector>

 void

 CssMKL<Matrix,Vector>::set_css_mkl_default_parameters(void* pt[], int_t iparm[]) const

 {

   for( int i = 0; i < 64; ++i ){

     pt[i] = nullptr;

     iparm[i] = 0;

   }

   iparm[0] = 1; /* No solver default */

   // Reset some of the default parameters

   iparm[1] = 10;  /* 2: Fill-in reordering from METIS, 3: thread dissection, 10: MPI version of the nested dissection and symbolic factorization*/

   iparm[7] = 0;   /* Max numbers of iterative refinement steps */

   iparm[10] = 0;  /* Disable nonsymmetric permutation and scaling MPS */

   iparm[11] = 0;  /* Normal solve (0), or a transpose solve (1) */

   iparm[12] = 0;  /* Do not use (non-)symmetric matchings */

   iparm[17] = -1; /* Output: Number of nonzeros in the factor LU */

   iparm[20] = 1;  /* Pivoting for symmetric indefinite matrices */

   iparm[26] = 1;  /* Check input matrix is sorted */


   // diagonal pertubation

   if (mtype_ == -2 || mtype_ == -4) {

     // symmetric indefinite

     iparm[9] = 8;   /* Perturb the pivot elements with 1E-8 */

   } else {

     // non-symmetric

     iparm[9] = 13;  /* Perturb the pivot elements with 1E-13 */

   }


   // set single or double precision

   if constexpr ( std::is_same_v<solver_magnitude_type, PMKL::_REAL_t> ) {

     iparm[27] = 1;           // single-precision

   } else {

     iparm[27] = 0;           // double-precision

   }

   iparm[34] = 1;  /* Use zero-based indexing */

 }


 template <class Matrix, class Vector>

 const char* CssMKL<Matrix,Vector>::name = "CSSMKL";


 template <class Matrix, class Vector>

 const typename CssMKL<Matrix,Vector>::int_t

 CssMKL<Matrix,Vector>::maxfct_ = 1;


 template <class Matrix, class Vector>

 const typename CssMKL<Matrix,Vector>::int_t

 CssMKL<Matrix,Vector>::mnum_ = 1;


 } // end namespace Amesos


 #endif  // AMESOS2_CSSMKL_DEF_HPP

Amesos2::SolverCore
Amesos2::SolverCore: A templated interface for interaction with third-party direct sparse solvers...
Definition: Amesos2_SolverCore_decl.hpp:71

Amesos2::EPhase
EPhase
Used to indicate a phase in the direct solution.
Definition: Amesos2_TypeDecl.hpp:31

Amesos2::CssMKL::check_css_mkl_error
void check_css_mkl_error(EPhase phase, int_t error) const
Throws an appropriate runtime error in the event that error &lt; 0 .
Definition: Amesos2_CssMKL_def.hpp:548

Amesos2::CssMKL
Amesos2 interface to the CssMKL package.
Definition: Amesos2_CssMKL_decl.hpp:49

Amesos2::CssMKL::~CssMKL
~CssMKL()
Destructor.
Definition: Amesos2_CssMKL_def.hpp:97

Amesos2::SolverCore::globalNumRows_
global_size_type globalNumRows_
Number of global rows in matrixA_.
Definition: Amesos2_SolverCore_decl.hpp:442

Amesos2::CssMKL::iparm_
int_t iparm_[64]
Definition: Amesos2_CssMKL_decl.hpp:279

Amesos2::Util::get_1d_copy_helper
Helper class for getting 1-D copies of multivectors.
Definition: Amesos2_MultiVecAdapter_decl.hpp:233

Amesos2::CssMKL::preOrdering_impl
int preOrdering_impl()
Performs pre-ordering on the matrix to increase efficiency.
Definition: Amesos2_CssMKL_def.hpp:121

Amesos2::CssMKL::CssMKL
CssMKL(Teuchos::RCP< const Matrix > A, Teuchos::RCP< Vector > X, Teuchos::RCP< const Vector > B)
Initialize from Teuchos::RCP.
Definition: Amesos2_CssMKL_def.hpp:40

Amesos2::CssMKL::set_css_mkl_matrix_type
void set_css_mkl_matrix_type(int_t mtype=0)
Definition: Amesos2_CssMKL_def.hpp:602

Amesos2::CssMKL::loadA_impl
bool loadA_impl(EPhase current_phase)
Reads matrix data into internal structures.
Definition: Amesos2_CssMKL_def.hpp:456

Amesos2_CssMKL_decl.hpp
A template class that does nothing useful besides show developers what, in general, needs to be done to add a new solver interface to the Amesos2 collection.

Amesos2::CssMKL::numericFactorization_impl
int numericFactorization_impl()
CssMKL specific numeric factorization.
Definition: Amesos2_CssMKL_def.hpp:169

Amesos2::CssMKL::matrixShapeOK_impl
bool matrixShapeOK_impl() const
Determines whether the shape of the matrix is OK for this solver.
Definition: Amesos2_CssMKL_def.hpp:272

Amesos2::CssMKL::solve_impl
int solve_impl(const Teuchos::Ptr< MultiVecAdapter< Vector > > X, const Teuchos::Ptr< const MultiVecAdapter< Vector > > B) const
CssMKL specific solve.
Definition: Amesos2_CssMKL_def.hpp:202

Amesos2_SolverCore_def.hpp

Amesos2::CssMKL::pt_
void * pt_[64]
CssMKL internal data address pointer.
Definition: Amesos2_CssMKL_decl.hpp:261

Amesos2::CssMKL::getValidParameters_impl
Teuchos::RCP< const Teuchos::ParameterList > getValidParameters_impl() const
Definition: Amesos2_CssMKL_def.hpp:380

Amesos2::Util::get_crs_helper_kokkos_view
Similar to get_ccs_helper , but used to get a CRS representation of the given matrix.
Definition: Amesos2_Util.hpp:629

Amesos2::CssMKL::symbolicFactorization_impl
int symbolicFactorization_impl()
Perform symbolic factorization of the matrix using CssMKL.
Definition: Amesos2_CssMKL_def.hpp:131

Amesos2::CssMKL::setParameters_impl
void setParameters_impl(const Teuchos::RCP< Teuchos::ParameterList > &parameterList)
Definition: Amesos2_CssMKL_def.hpp:281

Amesos2::EDistribution
EDistribution
Definition: Amesos2_TypeDecl.hpp:89

Amesos2::Util::put_1d_data_helper
Helper class for putting 1-D data arrays into multivectors.
Definition: Amesos2_MultiVecAdapter_decl.hpp:339

Amesos2::MultiVecAdapter
A templated MultiVector class adapter for Amesos2.
Definition: Amesos2_MultiVecAdapter_decl.hpp:142

Amesos2::SolverCore::matrixA_
Teuchos::RCP< const MatrixAdapter< Matrix > > matrixA_
The LHS operator.
Definition: Amesos2_SolverCore_decl.hpp:421