Ifpack2 Templated Preconditioning Package, Version 1.0
Ifpack2_Experimental_RBILUK_def.hpp
1 /*@HEADER
2 // ***********************************************************************
3 //
4 // Ifpack2: Templated Object-Oriented Algebraic Preconditioner Package
5 // Copyright (2009) Sandia Corporation
6 //
7 // Under terms of Contract DE-AC04-94AL85000, there is a non-exclusive
8 // license for use of this work by or on behalf of the U.S. Government.
9 //
10 // Redistribution and use in source and binary forms, with or without
11 // modification, are permitted provided that the following conditions are
12 // met:
13 //
14 // 1. Redistributions of source code must retain the above copyright
15 // notice, this list of conditions and the following disclaimer.
16 //
17 // 2. Redistributions in binary form must reproduce the above copyright
18 // notice, this list of conditions and the following disclaimer in the
19 // documentation and/or other materials provided with the distribution.
20 //
21 // 3. Neither the name of the Corporation nor the names of the
22 // contributors may be used to endorse or promote products derived from
23 // this software without specific prior written permission.
24 //
25 // THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY
26 // EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
27 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
28 // PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE
29 // CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
30 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
31 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
32 // PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
33 // LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
34 // NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
35 // SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
36 //
37 // Questions? Contact Michael A. Heroux (maherou@sandia.gov)
38 //
39 // ***********************************************************************
40 //@HEADER
41 */
42 
43 #ifndef IFPACK2_EXPERIMENTAL_CRSRBILUK_DEF_HPP
44 #define IFPACK2_EXPERIMENTAL_CRSRBILUK_DEF_HPP
45 
46 #include "Tpetra_BlockMultiVector.hpp"
47 #include "Tpetra_BlockView.hpp"
48 #include "Ifpack2_OverlappingRowMatrix.hpp"
49 #include "Ifpack2_LocalFilter.hpp"
50 #include "Ifpack2_Utilities.hpp"
51 #include "Ifpack2_RILUK.hpp"
52 
53 //#define IFPACK2_RBILUK_INITIAL
54 #define IFPACK2_RBILUK_INITIAL_NOKK
55 
56 #ifndef IFPACK2_RBILUK_INITIAL_NOKK
57 #include "KokkosBatched_Gemm_Decl.hpp"
58 #include "KokkosBatched_Gemm_Serial_Impl.hpp"
59 #include "KokkosBatched_Util.hpp"
60 #endif
61 
62 namespace Ifpack2 {
63 
64 namespace Experimental {
65 
66 template<class MatrixType>
67 RBILUK<MatrixType>::RBILUK (const Teuchos::RCP<const row_matrix_type>& Matrix_in)
68  : RILUK<row_matrix_type>(Teuchos::rcp_dynamic_cast<const row_matrix_type>(Matrix_in) ),
69  A_(Matrix_in),
70  A_block_(Teuchos::rcp_dynamic_cast<const block_crs_matrix_type>(Matrix_in))
71 {}
72 
73 template<class MatrixType>
74 RBILUK<MatrixType>::RBILUK (const Teuchos::RCP<const block_crs_matrix_type>& Matrix_in)
75  : RILUK<row_matrix_type>(Teuchos::rcp_dynamic_cast<const row_matrix_type>(Matrix_in) ),
76  A_block_(Matrix_in)
77 {}
78 
79 
80 template<class MatrixType>
81 RBILUK<MatrixType>::~RBILUK() {}
82 
83 
84 template<class MatrixType>
85 void
86 RBILUK<MatrixType>::setMatrix (const Teuchos::RCP<const block_crs_matrix_type>& A)
87 {
88  // FIXME (mfh 04 Nov 2015) What about A_? When does that get (re)set?
89 
90  // It's legal for A to be null; in that case, you may not call
91  // initialize() until calling setMatrix() with a nonnull input.
92  // Regardless, setting the matrix invalidates any previous
93  // factorization.
94  if (A.getRawPtr () != A_block_.getRawPtr ())
95  {
96  this->isAllocated_ = false;
97  this->isInitialized_ = false;
98  this->isComputed_ = false;
99  this->Graph_ = Teuchos::null;
100  L_block_ = Teuchos::null;
101  U_block_ = Teuchos::null;
102  D_block_ = Teuchos::null;
103  A_block_ = A;
104  }
105 }
106 
107 
108 
109 template<class MatrixType>
110 const typename RBILUK<MatrixType>::block_crs_matrix_type&
111 RBILUK<MatrixType>::getLBlock () const
112 {
113  TEUCHOS_TEST_FOR_EXCEPTION(
114  L_block_.is_null (), std::runtime_error, "Ifpack2::RILUK::getL: The L factor "
115  "is null. Please call initialize() (and preferably also compute()) "
116  "before calling this method. If the input matrix has not yet been set, "
117  "you must first call setMatrix() with a nonnull input matrix before you "
118  "may call initialize() or compute().");
119  return *L_block_;
120 }
121 
122 
123 template<class MatrixType>
124 const typename RBILUK<MatrixType>::block_crs_matrix_type&
125 RBILUK<MatrixType>::getDBlock () const
126 {
127  TEUCHOS_TEST_FOR_EXCEPTION(
128  D_block_.is_null (), std::runtime_error, "Ifpack2::RILUK::getD: The D factor "
129  "(of diagonal entries) is null. Please call initialize() (and "
130  "preferably also compute()) before calling this method. If the input "
131  "matrix has not yet been set, you must first call setMatrix() with a "
132  "nonnull input matrix before you may call initialize() or compute().");
133  return *D_block_;
134 }
135 
136 
137 template<class MatrixType>
138 const typename RBILUK<MatrixType>::block_crs_matrix_type&
139 RBILUK<MatrixType>::getUBlock () const
140 {
141  TEUCHOS_TEST_FOR_EXCEPTION(
142  U_block_.is_null (), std::runtime_error, "Ifpack2::RILUK::getU: The U factor "
143  "is null. Please call initialize() (and preferably also compute()) "
144  "before calling this method. If the input matrix has not yet been set, "
145  "you must first call setMatrix() with a nonnull input matrix before you "
146  "may call initialize() or compute().");
147  return *U_block_;
148 }
149 
150 template<class MatrixType>
151 void RBILUK<MatrixType>::allocate_L_and_U_blocks ()
152 {
153  using Teuchos::null;
154  using Teuchos::rcp;
155 
156  if (! this->isAllocated_) {
157  // Deallocate any existing storage. This avoids storing 2x
158  // memory, since RCP op= does not deallocate until after the
159  // assignment.
160  this->L_ = null;
161  this->U_ = null;
162  this->D_ = null;
163  L_block_ = null;
164  U_block_ = null;
165  D_block_ = null;
166 
167  // Allocate Matrix using ILUK graphs
168  L_block_ = rcp(new block_crs_matrix_type(*this->Graph_->getL_Graph (), blockSize_) );
169  U_block_ = rcp(new block_crs_matrix_type(*this->Graph_->getU_Graph (), blockSize_) );
170  D_block_ = rcp(new block_crs_matrix_type(*(Ifpack2::Details::computeDiagonalGraph(*(this->Graph_->getOverlapGraph()))),
171  blockSize_) );
172  L_block_->setAllToScalar (STM::zero ()); // Zero out L and U matrices
173  U_block_->setAllToScalar (STM::zero ());
174  D_block_->setAllToScalar (STM::zero ());
175 
176  }
177  this->isAllocated_ = true;
178 }
179 
180 template<class MatrixType>
181 Teuchos::RCP<const typename RBILUK<MatrixType>::block_crs_matrix_type>
182 RBILUK<MatrixType>::getBlockMatrix () const {
183  return A_block_;
184 }
185 
186 template<class MatrixType>
187 void RBILUK<MatrixType>::initialize ()
188 {
189  using Teuchos::RCP;
190  using Teuchos::rcp;
191  using Teuchos::rcp_dynamic_cast;
192  const char prefix[] = "Ifpack2::Experimental::RBILUK::initialize: ";
193 
194  // FIXME (mfh 04 Nov 2015) Apparently it's OK for A_ to be null.
195  // That probably means that this preconditioner was created with a
196  // BlockCrsMatrix directly, so it doesn't need the LocalFilter.
197 
198  // TEUCHOS_TEST_FOR_EXCEPTION
199  // (A_.is_null (), std::runtime_error, prefix << "The matrix (A_, the "
200  // "RowMatrix) is null. Please call setMatrix() with a nonnull input "
201  // "before calling this method.");
202 
203  if (A_block_.is_null ()) {
204  // FIXME (mfh 04 Nov 2015) Why does the input have to be a
205  // LocalFilter? Why can't we just take a regular matrix, and
206  // apply a LocalFilter only if necessary, like other "local"
207  // Ifpack2 preconditioners already do?
208  RCP<const LocalFilter<row_matrix_type> > filteredA =
209  rcp_dynamic_cast<const LocalFilter<row_matrix_type> >(A_);
210  TEUCHOS_TEST_FOR_EXCEPTION
211  (filteredA.is_null (), std::runtime_error, prefix <<
212  "Cannot cast to filtered matrix.");
213  RCP<const OverlappingRowMatrix<row_matrix_type> > overlappedA =
214  rcp_dynamic_cast<const OverlappingRowMatrix<row_matrix_type> > (filteredA->getUnderlyingMatrix ());
215  if (! overlappedA.is_null ()) {
216  A_block_ = rcp_dynamic_cast<const block_crs_matrix_type>(overlappedA->getUnderlyingMatrix());
217  } else {
218  //If there is no overlap, filteredA could be the block CRS matrix
219  A_block_ = rcp_dynamic_cast<const block_crs_matrix_type>(filteredA->getUnderlyingMatrix());
220  }
221  }
222 
223  TEUCHOS_TEST_FOR_EXCEPTION
224  (A_block_.is_null (), std::runtime_error, prefix << "The matrix (A_block_, "
225  "the BlockCrsMatrix) is null. Please call setMatrix() with a nonnull "
226  "input before calling this method.");
227  TEUCHOS_TEST_FOR_EXCEPTION
228  (! A_block_->isFillComplete (), std::runtime_error, prefix << "The matrix "
229  "(A_block_, the BlockCrsMatrix) is not fill complete. You may not invoke "
230  "initialize() or compute() with this matrix until the matrix is fill "
231  "complete. Note: BlockCrsMatrix is fill complete if and only if its "
232  "underlying graph is fill complete.");
233 
234  blockSize_ = A_block_->getBlockSize();
235 
236  Teuchos::Time timer ("RBILUK::initialize");
237  { // Start timing
238  Teuchos::TimeMonitor timeMon (timer);
239 
240  // Calling initialize() means that the user asserts that the graph
241  // of the sparse matrix may have changed. We must not just reuse
242  // the previous graph in that case.
243  //
244  // Regarding setting isAllocated_ to false: Eventually, we may want
245  // some kind of clever memory reuse strategy, but it's always
246  // correct just to blow everything away and start over.
247  this->isInitialized_ = false;
248  this->isAllocated_ = false;
249  this->isComputed_ = false;
250  this->Graph_ = Teuchos::null;
251 
252  typedef Tpetra::CrsGraph<local_ordinal_type,
253  global_ordinal_type,
254  node_type> crs_graph_type;
255 
256  RCP<const crs_graph_type> matrixCrsGraph = Teuchos::rcpFromRef(A_block_->getCrsGraph() );
257  this->Graph_ = rcp (new Ifpack2::IlukGraph<crs_graph_type> (matrixCrsGraph,
258  this->LevelOfFill_, 0));
259 
260  this->Graph_->initialize ();
261  allocate_L_and_U_blocks ();
262 #ifdef IFPACK2_RBILUK_INITIAL
263  initAllValues (*A_block_);
264 #endif
265  } // Stop timing
266 
267  this->isInitialized_ = true;
268  this->numInitialize_ += 1;
269  this->initializeTime_ += timer.totalElapsedTime ();
270 }
271 
272 
273 template<class MatrixType>
274 void
275 RBILUK<MatrixType>::
276 initAllValues (const block_crs_matrix_type& A)
277 {
278  using Teuchos::RCP;
279  typedef Tpetra::Map<local_ordinal_type,global_ordinal_type,node_type> map_type;
280 
281  local_ordinal_type NumIn = 0, NumL = 0, NumU = 0;
282  bool DiagFound = false;
283  size_t NumNonzeroDiags = 0;
284  size_t MaxNumEntries = A.getNodeMaxNumRowEntries();
285  local_ordinal_type blockMatSize = blockSize_*blockSize_;
286 
287  // First check that the local row map ordering is the same as the local portion of the column map.
288  // The extraction of the strictly lower/upper parts of A, as well as the factorization,
289  // implicitly assume that this is the case.
290  Teuchos::ArrayView<const global_ordinal_type> rowGIDs = A.getRowMap()->getNodeElementList();
291  Teuchos::ArrayView<const global_ordinal_type> colGIDs = A.getColMap()->getNodeElementList();
292  bool gidsAreConsistentlyOrdered=true;
293  global_ordinal_type indexOfInconsistentGID=0;
294  for (global_ordinal_type i=0; i<rowGIDs.size(); ++i) {
295  if (rowGIDs[i] != colGIDs[i]) {
296  gidsAreConsistentlyOrdered=false;
297  indexOfInconsistentGID=i;
298  break;
299  }
300  }
301  TEUCHOS_TEST_FOR_EXCEPTION(gidsAreConsistentlyOrdered==false, std::runtime_error,
302  "The ordering of the local GIDs in the row and column maps is not the same"
303  << std::endl << "at index " << indexOfInconsistentGID
304  << ". Consistency is required, as all calculations are done with"
305  << std::endl << "local indexing.");
306 
307  // Allocate temporary space for extracting the strictly
308  // lower and upper parts of the matrix A.
309  Teuchos::Array<local_ordinal_type> LI(MaxNumEntries);
310  Teuchos::Array<local_ordinal_type> UI(MaxNumEntries);
311  Teuchos::Array<scalar_type> LV(MaxNumEntries*blockMatSize);
312  Teuchos::Array<scalar_type> UV(MaxNumEntries*blockMatSize);
313 
314  Teuchos::Array<scalar_type> diagValues(blockMatSize);
315 
316  L_block_->setAllToScalar (STM::zero ()); // Zero out L and U matrices
317  U_block_->setAllToScalar (STM::zero ());
318  D_block_->setAllToScalar (STM::zero ()); // Set diagonal values to zero
319 
320  // NOTE (mfh 27 May 2016) The factorization below occurs entirely on
321  // host, so sync to host first. The const_cast is unfortunate but
322  // is our only option to make this correct.
323 
324  const_cast<block_crs_matrix_type&> (A).sync_host ();
325  L_block_->sync_host ();
326  U_block_->sync_host ();
327  D_block_->sync_host ();
328  // NOTE (mfh 27 May 2016) We're modifying L, U, and D on host.
329  L_block_->modify_host ();
330  U_block_->modify_host ();
331  D_block_->modify_host ();
332 
333  RCP<const map_type> rowMap = L_block_->getRowMap ();
334 
335  // First we copy the user's matrix into L and U, regardless of fill level.
336  // It is important to note that L and U are populated using local indices.
337  // This means that if the row map GIDs are not monotonically increasing
338  // (i.e., permuted or gappy), then the strictly lower (upper) part of the
339  // matrix is not the one that you would get if you based L (U) on GIDs.
340  // This is ok, as the *order* of the GIDs in the rowmap is a better
341  // expression of the user's intent than the GIDs themselves.
342 
343  for (size_t myRow=0; myRow<A.getNodeNumRows(); ++myRow) {
344  local_ordinal_type local_row = myRow;
345 
346  //TODO JJH 4April2014 An optimization is to use getLocalRowView. Not all matrices support this,
347  // we'd need to check via the Tpetra::RowMatrix method supportsRowViews().
348  const local_ordinal_type * InI = 0;
349  scalar_type * InV = 0;
350  A.getLocalRowView(local_row, InI, InV, NumIn);
351 
352  // Split into L and U (we don't assume that indices are ordered).
353 
354  NumL = 0;
355  NumU = 0;
356  DiagFound = false;
357 
358  for (local_ordinal_type j = 0; j < NumIn; ++j) {
359  const local_ordinal_type k = InI[j];
360  const local_ordinal_type blockOffset = blockMatSize*j;
361 
362  if (k == local_row) {
363  DiagFound = true;
364  // Store perturbed diagonal in Tpetra::Vector D_
365  for (local_ordinal_type jj = 0; jj < blockMatSize; ++jj)
366  diagValues[jj] = this->Rthresh_ * InV[blockOffset+jj] + IFPACK2_SGN(InV[blockOffset+jj]) * this->Athresh_;
367  D_block_->replaceLocalValues(local_row, &InI[j], diagValues.getRawPtr(), 1);
368  }
369  else if (k < 0) { // Out of range
370  TEUCHOS_TEST_FOR_EXCEPTION(
371  true, std::runtime_error, "Ifpack2::RILUK::initAllValues: current "
372  "GID k = " << k << " < 0. I'm not sure why this is an error; it is "
373  "probably an artifact of the undocumented assumptions of the "
374  "original implementation (likely copied and pasted from Ifpack). "
375  "Nevertheless, the code I found here insisted on this being an error "
376  "state, so I will throw an exception here.");
377  }
378  else if (k < local_row) {
379  LI[NumL] = k;
380  const local_ordinal_type LBlockOffset = NumL*blockMatSize;
381  for (local_ordinal_type jj = 0; jj < blockMatSize; ++jj)
382  LV[LBlockOffset+jj] = InV[blockOffset+jj];
383  NumL++;
384  }
385  else if (Teuchos::as<size_t>(k) <= rowMap->getNodeNumElements()) {
386  UI[NumU] = k;
387  const local_ordinal_type UBlockOffset = NumU*blockMatSize;
388  for (local_ordinal_type jj = 0; jj < blockMatSize; ++jj)
389  UV[UBlockOffset+jj] = InV[blockOffset+jj];
390  NumU++;
391  }
392  }
393 
394  // Check in things for this row of L and U
395 
396  if (DiagFound) {
397  ++NumNonzeroDiags;
398  } else
399  {
400  for (local_ordinal_type jj = 0; jj < blockSize_; ++jj)
401  diagValues[jj*(blockSize_+1)] = this->Athresh_;
402  D_block_->replaceLocalValues(local_row, &local_row, diagValues.getRawPtr(), 1);
403  }
404 
405  if (NumL) {
406  L_block_->replaceLocalValues(local_row, &LI[0], &LV[0], NumL);
407  }
408 
409  if (NumU) {
410  U_block_->replaceLocalValues(local_row, &UI[0], &UV[0], NumU);
411  }
412  }
413 
414  // NOTE (mfh 27 May 2016) Sync back to device, in case compute()
415  // ever gets a device implementation.
416  {
417  typedef typename block_crs_matrix_type::device_type device_type;
418  const_cast<block_crs_matrix_type&> (A).template sync<device_type> ();
419  L_block_->template sync<device_type> ();
420  U_block_->template sync<device_type> ();
421  D_block_->template sync<device_type> ();
422  }
423  this->isInitialized_ = true;
424 }
425 
426 namespace { // (anonymous)
427 
428 // For a given Kokkos::View type, possibly unmanaged, get the
429 // corresponding managed Kokkos::View type. This is handy for
430 // translating from little_block_type or little_vec_type (both
431 // possibly unmanaged) to their managed versions.
432 template<class LittleBlockType>
433 struct GetManagedView {
434  static_assert (Kokkos::Impl::is_view<LittleBlockType>::value,
435  "LittleBlockType must be a Kokkos::View.");
436  typedef Kokkos::View<typename LittleBlockType::non_const_data_type,
437  typename LittleBlockType::array_layout,
438  typename LittleBlockType::device_type> managed_non_const_type;
439  static_assert (static_cast<int> (managed_non_const_type::rank) ==
440  static_cast<int> (LittleBlockType::rank),
441  "managed_non_const_type::rank != LittleBlock::rank. "
442  "Please report this bug to the Ifpack2 developers.");
443 };
444 
445 } // namespace (anonymous)
446 
447 template<class MatrixType>
448 void RBILUK<MatrixType>::compute ()
449 {
450  typedef impl_scalar_type IST;
451  const char prefix[] = "Ifpack2::Experimental::RBILUK::compute: ";
452 
453  // initialize() checks this too, but it's easier for users if the
454  // error shows them the name of the method that they actually
455  // called, rather than the name of some internally called method.
456  TEUCHOS_TEST_FOR_EXCEPTION
457  (A_block_.is_null (), std::runtime_error, prefix << "The matrix (A_block_, "
458  "the BlockCrsMatrix) is null. Please call setMatrix() with a nonnull "
459  "input before calling this method.");
460  TEUCHOS_TEST_FOR_EXCEPTION
461  (! A_block_->isFillComplete (), std::runtime_error, prefix << "The matrix "
462  "(A_block_, the BlockCrsMatrix) is not fill complete. You may not invoke "
463  "initialize() or compute() with this matrix until the matrix is fill "
464  "complete. Note: BlockCrsMatrix is fill complete if and only if its "
465  "underlying graph is fill complete.");
466 
467  if (! this->isInitialized ()) {
468  initialize (); // Don't count this in the compute() time
469  }
470 
471  // NOTE (mfh 27 May 2016) The factorization below occurs entirely on
472  // host, so sync to host first. The const_cast is unfortunate but
473  // is our only option to make this correct.
474  if (! A_block_.is_null ()) {
475  Teuchos::RCP<block_crs_matrix_type> A_nc =
476  Teuchos::rcp_const_cast<block_crs_matrix_type> (A_block_);
477  A_nc->sync_host ();
478  }
479  L_block_->sync_host ();
480  U_block_->sync_host ();
481  D_block_->sync_host ();
482  // NOTE (mfh 27 May 2016) We're modifying L, U, and D on host.
483  L_block_->modify_host ();
484  U_block_->modify_host ();
485  D_block_->modify_host ();
486 
487  Teuchos::Time timer ("RBILUK::compute");
488  { // Start timing
489  Teuchos::TimeMonitor timeMon (timer);
490  this->isComputed_ = false;
491 
492  // MinMachNum should be officially defined, for now pick something a little
493  // bigger than IEEE underflow value
494 
495 // const scalar_type MinDiagonalValue = STS::rmin ();
496 // const scalar_type MaxDiagonalValue = STS::one () / MinDiagonalValue;
497  initAllValues (*A_block_);
498 
499  size_t NumIn;
500  local_ordinal_type NumL, NumU, NumURead;
501 
502  // Get Maximum Row length
503  const size_t MaxNumEntries =
504  L_block_->getNodeMaxNumRowEntries () + U_block_->getNodeMaxNumRowEntries () + 1;
505 
506  const local_ordinal_type blockMatSize = blockSize_*blockSize_;
507 
508  // FIXME (mfh 08 Nov 2015, 24 May 2016) We need to move away from
509  // expressing these strides explicitly, in order to finish #177
510  // (complete Kokkos-ization of BlockCrsMatrix) thoroughly.
511  const local_ordinal_type rowStride = blockSize_;
512 
513  Teuchos::Array<int> ipiv_teuchos(blockSize_);
514  Kokkos::View<int*, Kokkos::HostSpace,
515  Kokkos::MemoryUnmanaged> ipiv (ipiv_teuchos.getRawPtr (), blockSize_);
516  Teuchos::Array<IST> work_teuchos(blockSize_);
517  Kokkos::View<IST*, Kokkos::HostSpace,
518  Kokkos::MemoryUnmanaged> work (work_teuchos.getRawPtr (), blockSize_);
519 
520  size_t num_cols = U_block_->getColMap()->getNodeNumElements();
521  Teuchos::Array<int> colflag(num_cols);
522 
523  typename GetManagedView<little_block_type>::managed_non_const_type diagModBlock ("diagModBlock", blockSize_, blockSize_);
524  typename GetManagedView<little_block_type>::managed_non_const_type matTmp ("matTmp", blockSize_, blockSize_);
525  typename GetManagedView<little_block_type>::managed_non_const_type multiplier ("multiplier", blockSize_, blockSize_);
526 
527 // Teuchos::ArrayRCP<scalar_type> DV = D_->get1dViewNonConst(); // Get view of diagonal
528 
529  // Now start the factorization.
530 
531  // Need some integer workspace and pointers
532  local_ordinal_type NumUU;
533  for (size_t j = 0; j < num_cols; ++j) {
534  colflag[j] = -1;
535  }
536  Teuchos::Array<local_ordinal_type> InI(MaxNumEntries, 0);
537  Teuchos::Array<scalar_type> InV(MaxNumEntries*blockMatSize,STM::zero());
538 
539  const local_ordinal_type numLocalRows = L_block_->getNodeNumRows ();
540  for (local_ordinal_type local_row = 0; local_row < numLocalRows; ++local_row) {
541 
542  // Fill InV, InI with current row of L, D and U combined
543 
544  NumIn = MaxNumEntries;
545  const local_ordinal_type * colValsL;
546  scalar_type * valsL;
547 
548  L_block_->getLocalRowView(local_row, colValsL, valsL, NumL);
549  for (local_ordinal_type j = 0; j < NumL; ++j)
550  {
551  const local_ordinal_type matOffset = blockMatSize*j;
552  little_block_type lmat((typename little_block_type::value_type*) &valsL[matOffset],blockSize_,rowStride);
553  little_block_type lmatV((typename little_block_type::value_type*) &InV[matOffset],blockSize_,rowStride);
554  //lmatV.assign(lmat);
555  Tpetra::COPY (lmat, lmatV);
556  InI[j] = colValsL[j];
557  }
558 
559  little_block_type dmat = D_block_->getLocalBlock(local_row, local_row);
560  little_block_type dmatV((typename little_block_type::value_type*) &InV[NumL*blockMatSize], blockSize_, rowStride);
561  //dmatV.assign(dmat);
562  Tpetra::COPY (dmat, dmatV);
563  InI[NumL] = local_row;
564 
565  const local_ordinal_type * colValsU;
566  scalar_type * valsU;
567  U_block_->getLocalRowView(local_row, colValsU, valsU, NumURead);
568  NumU = 0;
569  for (local_ordinal_type j = 0; j < NumURead; ++j)
570  {
571  if (!(colValsU[j] < numLocalRows)) continue;
572  InI[NumL+1+j] = colValsU[j];
573  const local_ordinal_type matOffset = blockMatSize*(NumL+1+j);
574  little_block_type umat((typename little_block_type::value_type*) &valsU[blockMatSize*j], blockSize_, rowStride);
575  little_block_type umatV((typename little_block_type::value_type*) &InV[matOffset], blockSize_, rowStride);
576  //umatV.assign(umat);
577  Tpetra::COPY (umat, umatV);
578  NumU += 1;
579  }
580  NumIn = NumL+NumU+1;
581 
582  // Set column flags
583  for (size_t j = 0; j < NumIn; ++j) {
584  colflag[InI[j]] = j;
585  }
586 
587 #ifndef IFPACK2_RBILUK_INITIAL
588  for (local_ordinal_type i = 0; i < blockSize_; ++i)
589  for (local_ordinal_type j = 0; j < blockSize_; ++j){
590  {
591  diagModBlock(i,j) = 0;
592  }
593  }
594 #else
595  scalar_type diagmod = STM::zero (); // Off-diagonal accumulator
596  Kokkos::deep_copy (diagModBlock, diagmod);
597 #endif
598 
599  for (local_ordinal_type jj = 0; jj < NumL; ++jj) {
600  local_ordinal_type j = InI[jj];
601  little_block_type currentVal((typename little_block_type::value_type*) &InV[jj*blockMatSize], blockSize_, rowStride); // current_mults++;
602  //multiplier.assign(currentVal);
603  Tpetra::COPY (currentVal, multiplier);
604 
605  const little_block_type dmatInverse = D_block_->getLocalBlock(j,j);
606  // alpha = 1, beta = 0
607 #ifndef IFPACK2_RBILUK_INITIAL_NOKK
608  KokkosBatched::Experimental::SerialGemm
609  <KokkosBatched::Experimental::Trans::NoTranspose,
610  KokkosBatched::Experimental::Trans::NoTranspose,
611  KokkosBatched::Experimental::Algo::Gemm::Blocked>::invoke
612  (STS::one (), currentVal, dmatInverse, STS::zero (), matTmp);
613 #else
614  Tpetra::GEMM ("N", "N", STS::one (), currentVal, dmatInverse,
615  STS::zero (), matTmp);
616 #endif
617  //blockMatOpts.square_matrix_matrix_multiply(reinterpret_cast<impl_scalar_type*> (currentVal.data ()), reinterpret_cast<impl_scalar_type*> (dmatInverse.data ()), reinterpret_cast<impl_scalar_type*> (matTmp.data ()), blockSize_);
618  //currentVal.assign(matTmp);
619  Tpetra::COPY (matTmp, currentVal);
620 
621  const local_ordinal_type * UUI;
622  scalar_type * UUV;
623  U_block_->getLocalRowView(j, UUI, UUV, NumUU);
624 
625  if (this->RelaxValue_ == STM::zero ()) {
626  for (local_ordinal_type k = 0; k < NumUU; ++k) {
627  if (!(UUI[k] < numLocalRows)) continue;
628  const int kk = colflag[UUI[k]];
629  if (kk > -1) {
630  little_block_type kkval((typename little_block_type::value_type*) &InV[kk*blockMatSize], blockSize_, rowStride);
631  little_block_type uumat((typename little_block_type::value_type*) &UUV[k*blockMatSize], blockSize_, rowStride);
632 #ifndef IFPACK2_RBILUK_INITIAL_NOKK
633  KokkosBatched::Experimental::SerialGemm
634  <KokkosBatched::Experimental::Trans::NoTranspose,
635  KokkosBatched::Experimental::Trans::NoTranspose,
636  KokkosBatched::Experimental::Algo::Gemm::Blocked>::invoke
637  ( magnitude_type(-STM::one ()), multiplier, uumat, STM::one (), kkval);
638 #else
639  Tpetra::GEMM ("N", "N", magnitude_type(-STM::one ()), multiplier, uumat,
640  STM::one (), kkval);
641 #endif
642  //blockMatOpts.square_matrix_matrix_multiply(reinterpret_cast<impl_scalar_type*> (multiplier.data ()), reinterpret_cast<impl_scalar_type*> (uumat.data ()), reinterpret_cast<impl_scalar_type*> (kkval.data ()), blockSize_, -STM::one(), STM::one());
643  }
644  }
645  }
646  else {
647  for (local_ordinal_type k = 0; k < NumUU; ++k) {
648  if (!(UUI[k] < numLocalRows)) continue;
649  const int kk = colflag[UUI[k]];
650  little_block_type uumat((typename little_block_type::value_type*) &UUV[k*blockMatSize], blockSize_, rowStride);
651  if (kk > -1) {
652  little_block_type kkval((typename little_block_type::value_type*) &InV[kk*blockMatSize], blockSize_, rowStride);
653 #ifndef IFPACK2_RBILUK_INITIAL_NOKK
654  KokkosBatched::Experimental::SerialGemm
655  <KokkosBatched::Experimental::Trans::NoTranspose,
656  KokkosBatched::Experimental::Trans::NoTranspose,
657  KokkosBatched::Experimental::Algo::Gemm::Blocked>::invoke
658  (magnitude_type(-STM::one ()), multiplier, uumat, STM::one (), kkval);
659 #else
660  Tpetra::GEMM ("N", "N", magnitude_type(-STM::one ()), multiplier, uumat,
661  STM::one (), kkval);
662 #endif
663  //blockMatOpts.square_matrix_matrix_multiply(reinterpret_cast<impl_scalar_type*>(multiplier.data ()), reinterpret_cast<impl_scalar_type*>(uumat.data ()), reinterpret_cast<impl_scalar_type*>(kkval.data ()), blockSize_, -STM::one(), STM::one());
664  }
665  else {
666 #ifndef IFPACK2_RBILUK_INITIAL_NOKK
667  KokkosBatched::Experimental::SerialGemm
668  <KokkosBatched::Experimental::Trans::NoTranspose,
669  KokkosBatched::Experimental::Trans::NoTranspose,
670  KokkosBatched::Experimental::Algo::Gemm::Blocked>::invoke
671  (magnitude_type(-STM::one ()), multiplier, uumat, STM::one (), diagModBlock);
672 #else
673  Tpetra::GEMM ("N", "N", magnitude_type(-STM::one ()), multiplier, uumat,
674  STM::one (), diagModBlock);
675 #endif
676  //blockMatOpts.square_matrix_matrix_multiply(reinterpret_cast<impl_scalar_type*>(multiplier.data ()), reinterpret_cast<impl_scalar_type*>(uumat.data ()), reinterpret_cast<impl_scalar_type*>(diagModBlock.data ()), blockSize_, -STM::one(), STM::one());
677  }
678  }
679  }
680  }
681  if (NumL) {
682  // Replace current row of L
683  L_block_->replaceLocalValues (local_row, InI.getRawPtr (), InV.getRawPtr (), NumL);
684  }
685 
686  // dmat.assign(dmatV);
687  Tpetra::COPY (dmatV, dmat);
688 
689  if (this->RelaxValue_ != STM::zero ()) {
690  //dmat.update(this->RelaxValue_, diagModBlock);
691  Tpetra::AXPY (this->RelaxValue_, diagModBlock, dmat);
692  }
693 
694 // if (STS::magnitude (DV[i]) > STS::magnitude (MaxDiagonalValue)) {
695 // if (STS::real (DV[i]) < STM::zero ()) {
696 // DV[i] = -MinDiagonalValue;
697 // }
698 // else {
699 // DV[i] = MinDiagonalValue;
700 // }
701 // }
702 // else
703  {
704  int lapackInfo = 0;
705  for (int k = 0; k < blockSize_; ++k) {
706  ipiv[k] = 0;
707  }
708 
709  Tpetra::GETF2 (dmat, ipiv, lapackInfo);
710  //lapack.GETRF(blockSize_, blockSize_, d_raw, blockSize_, ipiv.getRawPtr(), &lapackInfo);
711  TEUCHOS_TEST_FOR_EXCEPTION(
712  lapackInfo != 0, std::runtime_error, "Ifpack2::Experimental::RBILUK::compute: "
713  "lapackInfo = " << lapackInfo << " which indicates an error in the factorization GETRF.");
714 
715  Tpetra::GETRI (dmat, ipiv, work, lapackInfo);
716  //lapack.GETRI(blockSize_, d_raw, blockSize_, ipiv.getRawPtr(), work.getRawPtr(), lwork, &lapackInfo);
717  TEUCHOS_TEST_FOR_EXCEPTION(
718  lapackInfo != 0, std::runtime_error, "Ifpack2::Experimental::RBILUK::compute: "
719  "lapackInfo = " << lapackInfo << " which indicates an error in the matrix inverse GETRI.");
720  }
721 
722  for (local_ordinal_type j = 0; j < NumU; ++j) {
723  little_block_type currentVal((typename little_block_type::value_type*) &InV[(NumL+1+j)*blockMatSize], blockSize_, rowStride); // current_mults++;
724  // scale U by the diagonal inverse
725 #ifndef IFPACK2_RBILUK_INITIAL_NOKK
726  KokkosBatched::Experimental::SerialGemm
727  <KokkosBatched::Experimental::Trans::NoTranspose,
728  KokkosBatched::Experimental::Trans::NoTranspose,
729  KokkosBatched::Experimental::Algo::Gemm::Blocked>::invoke
730  (STS::one (), dmat, currentVal, STS::zero (), matTmp);
731 #else
732  Tpetra::GEMM ("N", "N", STS::one (), dmat, currentVal,
733  STS::zero (), matTmp);
734 #endif
735  //blockMatOpts.square_matrix_matrix_multiply(reinterpret_cast<impl_scalar_type*>(dmat.data ()), reinterpret_cast<impl_scalar_type*>(currentVal.data ()), reinterpret_cast<impl_scalar_type*>(matTmp.data ()), blockSize_);
736  //currentVal.assign(matTmp);
737  Tpetra::COPY (matTmp, currentVal);
738  }
739 
740  if (NumU) {
741  // Replace current row of L and U
742  U_block_->replaceLocalValues (local_row, &InI[NumL+1], &InV[blockMatSize*(NumL+1)], NumU);
743  }
744 
745 #ifndef IFPACK2_RBILUK_INITIAL
746  // Reset column flags
747  for (size_t j = 0; j < NumIn; ++j) {
748  colflag[InI[j]] = -1;
749  }
750 #else
751  // Reset column flags
752  for (size_t j = 0; j < num_cols; ++j) {
753  colflag[j] = -1;
754  }
755 #endif
756  }
757 
758  } // Stop timing
759 
760  // Sync everything back to device, for efficient solves.
761  {
762  typedef typename block_crs_matrix_type::device_type device_type;
763  if (! A_block_.is_null ()) {
764  Teuchos::RCP<block_crs_matrix_type> A_nc =
765  Teuchos::rcp_const_cast<block_crs_matrix_type> (A_block_);
766  A_nc->template sync<device_type> ();
767  }
768  L_block_->template sync<device_type> ();
769  U_block_->template sync<device_type> ();
770  D_block_->template sync<device_type> ();
771  }
772 
773  this->isComputed_ = true;
774  this->numCompute_ += 1;
775  this->computeTime_ += timer.totalElapsedTime ();
776 }
777 
778 
779 template<class MatrixType>
780 void
781 RBILUK<MatrixType>::
782 apply (const Tpetra::MultiVector<scalar_type,local_ordinal_type,global_ordinal_type,node_type>& X,
783  Tpetra::MultiVector<scalar_type,local_ordinal_type,global_ordinal_type,node_type>& Y,
784  Teuchos::ETransp mode,
785  scalar_type alpha,
786  scalar_type beta) const
787 {
788  using Teuchos::RCP;
789  typedef Tpetra::BlockMultiVector<scalar_type,
790  local_ordinal_type, global_ordinal_type, node_type> BMV;
791  typedef Tpetra::MultiVector<scalar_type,
792  local_ordinal_type, global_ordinal_type, node_type> MV;
793 
794  TEUCHOS_TEST_FOR_EXCEPTION(
795  A_block_.is_null (), std::runtime_error, "Ifpack2::Experimental::RBILUK::apply: The matrix is "
796  "null. Please call setMatrix() with a nonnull input, then initialize() "
797  "and compute(), before calling this method.");
798  TEUCHOS_TEST_FOR_EXCEPTION(
799  ! this->isComputed (), std::runtime_error,
800  "Ifpack2::Experimental::RBILUK::apply: If you have not yet called compute(), "
801  "you must call compute() before calling this method.");
802  TEUCHOS_TEST_FOR_EXCEPTION(
803  X.getNumVectors () != Y.getNumVectors (), std::invalid_argument,
804  "Ifpack2::Experimental::RBILUK::apply: X and Y do not have the same number of columns. "
805  "X.getNumVectors() = " << X.getNumVectors ()
806  << " != Y.getNumVectors() = " << Y.getNumVectors () << ".");
807  TEUCHOS_TEST_FOR_EXCEPTION(
808  STS::isComplex && mode == Teuchos::CONJ_TRANS, std::logic_error,
809  "Ifpack2::Experimental::RBILUK::apply: mode = Teuchos::CONJ_TRANS is not implemented for "
810  "complex Scalar type. Please talk to the Ifpack2 developers to get this "
811  "fixed. There is a FIXME in this file about this very issue.");
812 
813  const local_ordinal_type blockMatSize = blockSize_*blockSize_;
814 
815  const local_ordinal_type rowStride = blockSize_;
816 
817  BMV yBlock (Y, * (A_block_->getGraph ()->getDomainMap ()), blockSize_);
818  const BMV xBlock (X, * (A_block_->getColMap ()), blockSize_);
819 
820  Teuchos::Array<scalar_type> lclarray(blockSize_);
821  little_vec_type lclvec((typename little_vec_type::value_type*)&lclarray[0], blockSize_);
822  const scalar_type one = STM::one ();
823  const scalar_type zero = STM::zero ();
824 
825  Teuchos::Time timer ("RBILUK::apply");
826  { // Start timing
827  Teuchos::TimeMonitor timeMon (timer);
828  if (alpha == one && beta == zero) {
829  if (mode == Teuchos::NO_TRANS) { // Solve L (D (U Y)) = X for Y.
830  // Start by solving L C = X for C. C must have the same Map
831  // as D. We have to use a temp multivector, since our
832  // implementation of triangular solves does not allow its
833  // input and output to alias one another.
834  //
835  // FIXME (mfh 24 Jan 2014) Cache this temp multivector.
836  const local_ordinal_type numVectors = xBlock.getNumVectors();
837  BMV cBlock (* (A_block_->getGraph ()->getDomainMap ()), blockSize_, numVectors);
838  BMV rBlock (* (A_block_->getGraph ()->getDomainMap ()), blockSize_, numVectors);
839  for (local_ordinal_type imv = 0; imv < numVectors; ++imv)
840  {
841  for (size_t i = 0; i < D_block_->getNodeNumRows(); ++i)
842  {
843  local_ordinal_type local_row = i;
844  little_vec_type xval = xBlock.getLocalBlock(local_row,imv);
845  little_vec_type cval = cBlock.getLocalBlock(local_row,imv);
846  //cval.assign(xval);
847  Tpetra::COPY (xval, cval);
848 
849  local_ordinal_type NumL;
850  const local_ordinal_type * colValsL;
851  scalar_type * valsL;
852 
853  L_block_->getLocalRowView(local_row, colValsL, valsL, NumL);
854 
855  for (local_ordinal_type j = 0; j < NumL; ++j)
856  {
857  local_ordinal_type col = colValsL[j];
858  little_vec_type prevVal = cBlock.getLocalBlock(col, imv);
859 
860  const local_ordinal_type matOffset = blockMatSize*j;
861  little_block_type lij((typename little_block_type::value_type*) &valsL[matOffset],blockSize_,rowStride);
862 
863  //cval.matvecUpdate(-one, lij, prevVal);
864  Tpetra::GEMV (-one, lij, prevVal, cval);
865  }
866  }
867  }
868 
869  // Solve D R = C. Note that D has been replaced by D^{-1} at this point.
870  D_block_->applyBlock(cBlock, rBlock);
871 
872  // Solve U Y = R.
873  for (local_ordinal_type imv = 0; imv < numVectors; ++imv)
874  {
875  const local_ordinal_type numRows = D_block_->getNodeNumRows();
876  for (local_ordinal_type i = 0; i < numRows; ++i)
877  {
878  local_ordinal_type local_row = (numRows-1)-i;
879  little_vec_type rval = rBlock.getLocalBlock(local_row,imv);
880  little_vec_type yval = yBlock.getLocalBlock(local_row,imv);
881  //yval.assign(rval);
882  Tpetra::COPY (rval, yval);
883 
884  local_ordinal_type NumU;
885  const local_ordinal_type * colValsU;
886  scalar_type * valsU;
887 
888  U_block_->getLocalRowView(local_row, colValsU, valsU, NumU);
889 
890  for (local_ordinal_type j = 0; j < NumU; ++j)
891  {
892  local_ordinal_type col = colValsU[NumU-1-j];
893  little_vec_type prevVal = yBlock.getLocalBlock(col, imv);
894 
895  const local_ordinal_type matOffset = blockMatSize*(NumU-1-j);
896  little_block_type uij((typename little_block_type::value_type*) &valsU[matOffset], blockSize_, rowStride);
897 
898  //yval.matvecUpdate(-one, uij, prevVal);
899  Tpetra::GEMV (-one, uij, prevVal, yval);
900  }
901  }
902  }
903  }
904  else { // Solve U^P (D^P (L^P Y)) = X for Y (where P is * or T).
905  TEUCHOS_TEST_FOR_EXCEPTION(
906  true, std::runtime_error,
907  "Ifpack2::Experimental::RBILUK::apply: transpose apply is not implemented for the block algorithm. ");
908  }
909  }
910  else { // alpha != 1 or beta != 0
911  if (alpha == zero) {
912  if (beta == zero) {
913  Y.putScalar (zero);
914  } else {
915  Y.scale (beta);
916  }
917  } else { // alpha != zero
918  MV Y_tmp (Y.getMap (), Y.getNumVectors ());
919  apply (X, Y_tmp, mode);
920  Y.update (alpha, Y_tmp, beta);
921  }
922  }
923  } // Stop timing
924 
925  this->numApply_ += 1;
926  this->applyTime_ = timer.totalElapsedTime ();
927 }
928 
929 
930 template<class MatrixType>
931 std::string RBILUK<MatrixType>::description () const
932 {
933  std::ostringstream os;
934 
935  // Output is a valid YAML dictionary in flow style. If you don't
936  // like everything on a single line, you should call describe()
937  // instead.
938  os << "\"Ifpack2::Experimental::RBILUK\": {";
939  os << "Initialized: " << (this->isInitialized () ? "true" : "false") << ", "
940  << "Computed: " << (this->isComputed () ? "true" : "false") << ", ";
941 
942  os << "Level-of-fill: " << this->getLevelOfFill() << ", ";
943 
944  if (A_block_.is_null ()) {
945  os << "Matrix: null";
946  }
947  else {
948  os << "Global matrix dimensions: ["
949  << A_block_->getGlobalNumRows () << ", " << A_block_->getGlobalNumCols () << "]"
950  << ", Global nnz: " << A_block_->getGlobalNumEntries();
951  }
952 
953  os << "}";
954  return os.str ();
955 }
956 
957 } // namespace Experimental
958 
959 } // namespace Ifpack2
960 
961 // FIXME (mfh 26 Aug 2015) We only need to do instantiation for
962 // MatrixType = Tpetra::RowMatrix. Conversions to BlockCrsMatrix are
963 // handled internally via dynamic cast.
964 
965 #define IFPACK2_EXPERIMENTAL_RBILUK_INSTANT(S,LO,GO,N) \
966  template class Ifpack2::Experimental::RBILUK< Tpetra::BlockCrsMatrix<S, LO, GO, N> >; \
967  template class Ifpack2::Experimental::RBILUK< Tpetra::RowMatrix<S, LO, GO, N> >;
968 
969 #endif
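
For context, the sketch below shows one way this preconditioner is typically driven from user code: construct it on a fill-complete Tpetra::BlockCrsMatrix, then call initialize(), compute(), and apply() as defined in the listing above. This is a minimal illustration and not part of the file; the aggregate header name, the use of Tpetra's default template parameters, and the function name applyRBILUK are assumptions made for the example.

#include "Ifpack2_Experimental_RBILUK.hpp"   // assumed aggregate header (decl + def)
#include "Tpetra_BlockCrsMatrix.hpp"
#include "Tpetra_MultiVector.hpp"
#include "Teuchos_RCP.hpp"

// Use Tpetra's default Scalar/LocalOrdinal/GlobalOrdinal/Node types.
typedef Tpetra::BlockCrsMatrix<> block_matrix_type;
typedef Tpetra::MultiVector<>    mv_type;

// Apply z := M^{-1} r, where M is the block ILU(k) factorization of A.
// A must be fill complete, as initialize() and compute() above require.
void applyRBILUK (const Teuchos::RCP<const block_matrix_type>& A,
                  const mv_type& r, mv_type& z)
{
  // The second constructor in the listing takes the BlockCrsMatrix directly.
  Ifpack2::Experimental::RBILUK<block_matrix_type> prec (A);

  // Level of fill and relaxation/threshold options come from the
  // setParameters() interface inherited from RILUK (not shown here).
  prec.initialize (); // symbolic factorization: builds the level-k graphs for L and U
  prec.compute ();    // numeric factorization: fills the L, U, and inverted D blocks
  prec.apply (r, z);  // block triangular solves: L (D (U z)) = r
}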
Cross-references for this listing (full member documentation is in Ifpack2_Experimental_RBILUK_decl.hpp):

Ifpack2::Experimental::RBILUK -- ILU(k) factorization of a given Tpetra::BlockCrsMatrix. (Ifpack2_Experimental_RBILUK_decl.hpp:128)
Ifpack2::RILUK -- ILU(k) factorization of a given Tpetra::RowMatrix. (Ifpack2_RILUK_decl.hpp:243)
Ifpack2::IlukGraph -- Construct a level filled graph for use in computing an ILU(k) incomplete factorization. (Ifpack2_IlukGraph.hpp:97)
Ifpack2::LocalFilter -- Access only local rows and columns of a sparse matrix. (Ifpack2_LocalFilter_decl.hpp:160)
Ifpack2::OverlappingRowMatrix -- Sparse matrix (Tpetra::RowMatrix subclass) with ghost rows. (Ifpack2_OverlappingRowMatrix_decl.hpp:58)
Ifpack2_Utilities.hpp -- File for utility functions.

virtual ~RBILUK() -- Destructor (declared virtual for memory safety). (Ifpack2_Experimental_RBILUK_def.hpp:81)
void setMatrix(const Teuchos::RCP<const block_crs_matrix_type>& A) -- Change the matrix to be preconditioned. (Ifpack2_Experimental_RBILUK_def.hpp:86)
void initialize() -- Initialize by computing the symbolic incomplete factorization. (Ifpack2_Experimental_RBILUK_def.hpp:187)
void compute() -- Compute the (numeric) incomplete factorization. (Ifpack2_Experimental_RBILUK_def.hpp:448)
void apply(const Tpetra::MultiVector<scalar_type, local_ordinal_type, global_ordinal_type, node_type>& X, Tpetra::MultiVector<scalar_type, local_ordinal_type, global_ordinal_type, node_type>& Y, Teuchos::ETransp mode = Teuchos::NO_TRANS, scalar_type alpha = Teuchos::ScalarTraits<scalar_type>::one(), scalar_type beta = Teuchos::ScalarTraits<scalar_type>::zero()) const -- Apply the (inverse of the) incomplete factorization to X, resulting in Y. (Ifpack2_Experimental_RBILUK_def.hpp:782)
std::string description() const -- A one-line description of this object. (Ifpack2_Experimental_RBILUK_def.hpp:931)
Teuchos::RCP<const block_crs_matrix_type> getBlockMatrix() const -- Get the input matrix. (Ifpack2_Experimental_RBILUK_def.hpp:182)
const block_crs_matrix_type& getLBlock() const -- Return the L factor of the ILU factorization. (Ifpack2_Experimental_RBILUK_def.hpp:111)
const block_crs_matrix_type& getDBlock() const -- Return the diagonal entries of the ILU factorization. (Ifpack2_Experimental_RBILUK_def.hpp:125)
const block_crs_matrix_type& getUBlock() const -- Return the U factor of the ILU factorization. (Ifpack2_Experimental_RBILUK_def.hpp:139)

MatrixType::scalar_type scalar_type -- The type of the entries of the input MatrixType. (Ifpack2_Experimental_RBILUK_decl.hpp:136)
MatrixType::local_ordinal_type local_ordinal_type -- The type of local indices in the input MatrixType. (Ifpack2_Experimental_RBILUK_decl.hpp:142)
MatrixType::global_ordinal_type global_ordinal_type -- The type of global indices in the input MatrixType. (Ifpack2_Experimental_RBILUK_decl.hpp:145)
MatrixType::node_type node_type -- The Node type used by the input MatrixType. (Ifpack2_Experimental_RBILUK_decl.hpp:148)
Teuchos::ScalarTraits<scalar_type>::magnitudeType magnitude_type -- The type of the magnitude (absolute value) of a matrix entry. (Ifpack2_Experimental_RBILUK_decl.hpp:151)
Tpetra::RowMatrix<scalar_type, local_ordinal_type, global_ordinal_type, node_type> row_matrix_type -- Tpetra::RowMatrix specialization used by this class. (Ifpack2_Experimental_RBILUK_decl.hpp:157)