46 #ifndef MUELU_UTILITIESBASE_DEF_HPP
47 #define MUELU_UTILITIESBASE_DEF_HPP
53 #include <Kokkos_Core.hpp>
54 #include <KokkosSparse_CrsMatrix.hpp>
55 #include <KokkosSparse_getDiagCopy.hpp>
57 #include <Xpetra_BlockedVector.hpp>
58 #include <Xpetra_BlockedMap.hpp>
59 #include <Xpetra_BlockedMultiVector.hpp>
67 #include <Xpetra_CrsMatrixWrap.hpp>
68 #include <Xpetra_StridedMap.hpp>
72 #include <KokkosKernels_Handle.hpp>
73 #include <KokkosGraph_RCM.hpp>
// Conversion helper (signature line is not visible in this excerpt).
// Visible contract: the declared return type is an RCP to an Xpetra::Matrix, and the
// body returns a freshly allocated CrsMatrixWrap constructed from `Op`, handed to rcp().
77 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
78 RCP<Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>>
83 return rcp(
new CrsMatrixWrap(Op));
// Builds a new matrix `Aout` from `Ain`, row by row (signature and several body lines
// are not visible in this excerpt). For each local row, entries are copied into the
// scratch arrays `indout`/`valout` (as global column ids and values), the value array is
// trimmed to the number kept, and the row is inserted into `Aout` by global ids.
86 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
// A non-positive expectedNNZperRow falls back to Ain's global maximum row length.
92 RCP<CrsMatrixWrap> Aout =
rcp(
new CrsMatrixWrap(rowmap, expectedNNZperRow <= 0 ? Ain->getGlobalMaxNumRowEntries() : expectedNNZperRow));
94 for (
size_t row = 0; row < Ain->getLocalNumRows(); row++) {
95 size_t nnz = Ain->getNumEntriesInLocalRow(row);
99 Ain->getLocalRowView(row, indices, vals);
// Running count of entries written to indout/valout for this row.
105 size_t nNonzeros = 0;
// Local column index of this row's global id.
// NOTE(review): presumably used to recognise the diagonal entry - the test itself is not visible here.
108 LocalOrdinal lclColIdx = colmap->getLocalElement(glbRow);
// Two copy loops follow with identical visible bodies; the condition that selects
// between them and any per-entry filter are on lines missing from this excerpt.
109 for (
size_t i = 0; i < (size_t)indices.
size(); i++) {
111 indout[nNonzeros] = colmap->getGlobalElement(indices[i]);
112 valout[nNonzeros] = vals[i];
117 for (
size_t i = 0; i < (size_t)indices.
size(); i++) {
119 indout[nNonzeros] = colmap->getGlobalElement(indices[i]);
120 valout[nNonzeros] = vals[i];
126 valout.resize(nNonzeros);
128 Aout->insertGlobalValues(Ain->getRowMap()->getGlobalElement(row), indout.view(0, indout.size()), valout.view(0, valout.size()));
// The result reuses Ain's domain and range maps.
130 Aout->fillComplete(Ain->getDomainMap(), Ain->getRangeMap());
// Builds and returns a CrsGraph (`sparsityPattern`) over A's row map that keeps, per
// row, the diagonal entry plus every entry whose scaled magnitude exceeds |threshold|.
// The signature and the line that inserts `indicesNew` into the graph are not visible here.
135 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
// A non-positive expectedNNZperRow falls back to A's global maximum row length.
140 RCP<CrsGraph> sparsityPattern = CrsGraphFactory::Build(A->getRowMap(), expectedNNZperRow <= 0 ? A->getGlobalMaxNumRowEntries() : expectedNNZperRow);
142 RCP<Vector> diag = GetMatrixOverlappedDiagonal(*A);
145 for (
size_t row = 0; row < A->getLocalNumRows(); row++) {
148 A->getLocalRowView(row, indices, vals);
// Translate the local row to the local column index of the same global id.
150 GlobalOrdinal globalRow = A->getRowMap()->getGlobalElement(row);
151 LocalOrdinal col = A->getColMap()->getLocalElement(globalRow);
// Scaling factor for this row: |D[col]|, or 1 when that magnitude is not positive.
// NOTE(review): `D` is declared on a line not visible here; presumably it views the data of `diag` - confirm.
153 const Scalar Dk = STS::magnitude(D[col]) > 0.0 ? STS::magnitude(D[col]) : 1.0;
156 for (
size_t i = 0; i < size_t(indices.
size()); i++)
// Keep the entry if it sits at local column `col`, or if |sqrt(Dk) * a_ij * sqrt(Dk)| > |threshold|.
// Both scale factors use the current row's Dk.
158 if (col == indices[i] || STS::magnitude(STS::squareroot(Dk) * vals[i] * STS::squareroot(Dk)) > STS::magnitude(threshold))
159 indicesNew.
append(A->getColMap()->getGlobalElement(indices[i]));
163 sparsityPattern->fillComplete();
165 return sparsityPattern;
// Row-wise scan for the diagonal entry of A (signature, row-view extraction and the
// actions taken in each branch are not visible in this excerpt).
168 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
172 size_t numRows = A.getRowMap()->getLocalNumElements();
176 for (
size_t i = 0; i < numRows; ++i) {
// Linear search through the row's column indices for the entry equal to the row index i.
179 for (; j < cols.
size(); ++j) {
180 if (Teuchos::as<size_t>(cols[j]) == i) {
// j reaching cols.size() means the search above ran to the end of the row.
// NOTE(review): presumably the "no stored diagonal" case - the matching branch body is not visible.
185 if (j == cols.
size()) {
// Copies the local diagonal of A into the vector `diag` (signature, creation of `diag`
// and the branch headers are not visible in this excerpt). Two code paths are visible:
// one through the underlying CrsMatrix using precomputed diagonal offsets, and one that
// calls A.getLocalDiagCopy directly.
193 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
197 const auto rowMap = A.getRowMap();
// dynamic_cast on a pointer yields nullptr when A is not a CrsMatrixWrap.
// NOTE(review): the null check that selects between the two paths below is not visible here.
200 const CrsMatrixWrap* crsOp =
dynamic_cast<const CrsMatrixWrap*
>(&A);
202 using local_vector_type =
typename Vector::dual_view_type::t_dev_um;
203 using device_type =
typename CrsGraph::device_type;
// One offset slot per local row; filled by the graph, then consumed by getLocalDiagCopy.
204 Kokkos::View<size_t*, device_type> offsets(
"offsets", rowMap->getLocalNumElements());
205 crsOp->getCrsGraph()->getLocalDiagOffsets(offsets);
206 crsOp->getCrsMatrix()->getLocalDiagCopy(*diag, offsets);
// Alternative path that does not go through the CrsMatrixWrap pointer.
208 A.getLocalDiagCopy(*diag);
// Computes a vector of reciprocal diagonal values of A using Kokkos kernels over the
// local device matrix (most of the signature and the branch on `doLumped` are not
// visible in this excerpt). Two kernels are visible:
//   1. per row, locate the entry whose column index equals the row index and store its
//      reciprocal (or the replacement value when its magnitude does not exceed |tol|);
//      rows without such an entry get zero;
//   2. per row, accumulate the magnitudes of all entries and store the reciprocal of
//      that sum (or the replacement value when it does not exceed |tol|).
// NOTE(review): presumably `doLumped` selects kernel 2 - confirm against the hidden branch.
230 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
236 const bool doLumped) {
249 using local_matrix_type =
typename Matrix::local_matrix_type;
251 using value_type =
typename local_matrix_type::value_type;
252 using values_type =
typename local_matrix_type::values_type;
253 using scalar_type =
typename values_type::non_const_value_type;
254 using ordinal_type =
typename local_matrix_type::ordinal_type;
255 using execution_space =
typename local_matrix_type::execution_space;
262 using KAT = Kokkos::ArithTraits<value_type>;
266 RCP<Vector> diag = VectorFactory::Build(rowMap,
false);
269 local_matrix_type localMatrix = A.getLocalMatrixDevice();
270 auto diagVals = diag->getDeviceLocalView(Xpetra::Access::ReadWrite);
272 ordinal_type numRows = localMatrix.graph.numRows();
// Copy the replacement value into a local of the kernel's scalar type so the lambdas capture it by value.
274 scalar_type valReplacement_dev = valReplacement;
// Kernel 1: reciprocal of the stored diagonal entry.
281 Kokkos::parallel_for(
282 "Utilities::GetMatrixDiagonalInverse",
283 Kokkos::RangePolicy<ordinal_type, execution_space>(0, numRows),
284 KOKKOS_LAMBDA(
const ordinal_type rowIdx) {
285 bool foundDiagEntry =
false;
286 auto myRow = localMatrix.rowConst(rowIdx);
287 for (ordinal_type entryIdx = 0; entryIdx < myRow.length; ++entryIdx) {
// The diagonal is identified by local column index == local row index.
288 if (myRow.colidx(entryIdx) == rowIdx) {
289 foundDiagEntry =
true;
290 if (KAT::magnitude(myRow.value(entryIdx)) > KAT::magnitude(tol)) {
291 diagVals(rowIdx, 0) = KAT::one() / myRow.value(entryIdx);
293 diagVals(rowIdx, 0) = valReplacement_dev;
// No stored diagonal entry in this row: write zero.
299 if (!foundDiagEntry) {
300 diagVals(rowIdx, 0) = KAT::zero();
// Kernel 2: reciprocal of the row's sum of entry magnitudes.
304 Kokkos::parallel_for(
305 "Utilities::GetMatrixDiagonalInverse",
306 Kokkos::RangePolicy<ordinal_type, execution_space>(0, numRows),
307 KOKKOS_LAMBDA(
const ordinal_type rowIdx) {
308 auto myRow = localMatrix.rowConst(rowIdx);
309 for (ordinal_type entryIdx = 0; entryIdx < myRow.length; ++entryIdx) {
// NOTE(review): this accumulates with += into diagVals, and `diag` was built with `false`
// as its second argument; no zeroing of diagVals is visible in this excerpt - confirm the
// vector is zero before this kernel runs.
310 diagVals(rowIdx, 0) += KAT::magnitude(myRow.value(entryIdx));
312 if (KAT::magnitude(diagVals(rowIdx, 0)) > KAT::magnitude(tol))
313 diagVals(rowIdx, 0) = KAT::one() / diagVals(rowIdx, 0);
315 diagVals(rowIdx, 0) = valReplacement_dev;
// Computes a lumped diagonal of A (row sums of entry magnitudes), optionally turned into
// reciprocals. Most of the signature, several declarations and branch headers are not
// visible in this excerpt. Three paths are visible:
//   * non-blocked matrix on the Tpetra backend: Kokkos kernels on device views;
//   * non-blocked matrix otherwise: host loops over local row views;
//   * blocked matrix: per-block results are accumulated into the range sub-vectors
//     (the visible error string says reciprocals are not supported for blocked matrices).
321 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
327 const bool replaceSingleEntryRowWithZero,
328 const bool useAverageAbsDiagVal) {
332 const Scalar zero = TST::zero();
333 const Scalar one = TST::one();
334 const Scalar two = one + one;
// bA null: A is handled as a single (non-blocked) matrix.
340 if (bA == Teuchos::null) {
344 if (rowMap->lib() == Xpetra::UnderlyingLib::UseTpetra) {
347 using local_vector_type =
typename Vector::dual_view_type::t_dev_um;
348 using local_matrix_type =
typename Matrix::local_matrix_type;
349 using execution_space =
typename local_vector_type::execution_space;
352 using values_type =
typename local_matrix_type::values_type;
353 using scalar_type =
typename values_type::non_const_value_type;
354 using mag_type =
typename Kokkos::ArithTraits<scalar_type>::mag_type;
355 using KAT_S =
typename Kokkos::ArithTraits<scalar_type>;
356 using KAT_M =
typename Kokkos::ArithTraits<mag_type>;
357 using size_type =
typename local_matrix_type::non_const_size_type;
359 local_vector_type diag_dev = diag->getDeviceLocalView(Xpetra::Access::OverwriteAll);
360 local_matrix_type local_mat_dev = rcpA->getLocalMatrixDevice();
// One work item per local row of the output vector.
361 Kokkos::RangePolicy<execution_space, int> my_policy(0, static_cast<int>(diag_dev.extent(0)));
362 scalar_type valReplacement_dev = valReplacement;
// Per-row scratch (entry count, signed row sum) and two rank-0 accumulators.
365 Kokkos::View<int*, execution_space> nnzPerRow(
"nnz per rows", diag_dev.extent(0));
366 Kokkos::View<scalar_type*, execution_space> regSum(
"regSum", diag_dev.extent(0));
367 Kokkos::View<mag_type, execution_space> avgAbsDiagVal_dev(
"avgAbsDiagVal");
368 Kokkos::View<int, execution_space> numDiagsEqualToOne_dev(
"numDiagsEqualToOne");
// Kernel: per row, accumulate the signed sum (regSum) and the sum of magnitudes (diag_dev).
372 Kokkos::parallel_for(
373 "GetLumpedMatrixDiagonal", my_policy,
374 KOKKOS_LAMBDA(
const int rowIdx) {
375 diag_dev(rowIdx, 0) = KAT_S::zero();
376 for (size_type entryIdx = local_mat_dev.graph.row_map(rowIdx);
377 entryIdx < local_mat_dev.graph.row_map(rowIdx + 1);
379 regSum(rowIdx) += local_mat_dev.values(entryIdx);
// NOTE(review): the statement guarded by this nonzero test is not visible; presumably it bumps nnzPerRow.
380 if (KAT_M::zero() < KAT_S::abs(local_mat_dev.values(entryIdx))) {
383 diag_dev(rowIdx, 0) += KAT_S::abs(local_mat_dev.values(entryIdx));
// Diagonal entries also feed the shared accumulator; atomic because rows run in parallel.
384 if (rowIdx == local_mat_dev.graph.entries(entryIdx)) {
385 Kokkos::atomic_add(&avgAbsDiagVal_dev(), KAT_S::abs(local_mat_dev.values(entryIdx)));
// Count rows with exactly one counted entry whose lumped magnitude equals one.
389 if (nnzPerRow(rowIdx) == 1 && KAT_S::magnitude(diag_dev(rowIdx, 0)) == KAT_M::one()) {
390 Kokkos::atomic_add(&numDiagsEqualToOne_dev(), 1);
// Bring both accumulators back to the host when the average is requested.
394 if (useAverageAbsDiagVal) {
396 typename Kokkos::View<mag_type, execution_space>::HostMirror avgAbsDiagVal = Kokkos::create_mirror_view(avgAbsDiagVal_dev);
397 Kokkos::deep_copy(avgAbsDiagVal, avgAbsDiagVal_dev);
398 int numDiagsEqualToOne;
399 Kokkos::deep_copy(numDiagsEqualToOne, numDiagsEqualToOne_dev);
// Kernel: turn the lumped values into reciprocals, in this priority order:
//   single-entry row (when requested)      -> zero
//   nonzero lumped value below |2*regSum|  -> 1 / |2*regSum|
//   magnitude above tol                    -> 1 / value
//   otherwise                              -> replacement value
406 Kokkos::parallel_for(
407 "ComputeLumpedDiagonalInverse", my_policy,
408 KOKKOS_LAMBDA(
const int rowIdx) {
409 if (replaceSingleEntryRowWithZero && nnzPerRow(rowIdx) <= 1) {
410 diag_dev(rowIdx, 0) = KAT_S::zero();
411 }
else if ((diag_dev(rowIdx, 0) != KAT_S::zero()) && (KAT_S::magnitude(diag_dev(rowIdx, 0)) < KAT_S::magnitude(2 * regSum(rowIdx)))) {
412 diag_dev(rowIdx, 0) = KAT_S::one() / KAT_S::magnitude(2 * regSum(rowIdx));
414 if (KAT_S::magnitude(diag_dev(rowIdx, 0)) > tol) {
415 diag_dev(rowIdx, 0) = KAT_S::one() / diag_dev(rowIdx, 0);
417 diag_dev(rowIdx, 0) = valReplacement_dev;
// Kernel: plain lumping only (sum of magnitudes per row, no reciprocal).
425 Kokkos::parallel_for(
426 "GetLumpedMatrixDiagonal", my_policy,
427 KOKKOS_LAMBDA(
const int rowIdx) {
428 diag_dev(rowIdx, 0) = KAT_S::zero();
429 for (size_type entryIdx = local_mat_dev.graph.row_map(rowIdx);
430 entryIdx < local_mat_dev.graph.row_map(rowIdx + 1);
432 diag_dev(rowIdx, 0) += KAT_S::magnitude(local_mat_dev.values(entryIdx));
// Host path: same accumulation and reciprocal rules as the kernels above, on local row views.
444 std::vector<int> nnzPerRow(rowMap->getLocalNumElements());
449 const Magnitude zeroMagn = TST::magnitude(zero);
450 Magnitude avgAbsDiagVal = TST::magnitude(zero);
451 int numDiagsEqualToOne = 0;
452 for (
size_t i = 0; i < rowMap->getLocalNumElements(); ++i) {
454 rcpA->getLocalRowView(i, cols, vals);
457 regSum[i] += vals[j];
458 const Magnitude rowEntryMagn = TST::magnitude(vals[j]);
459 if (rowEntryMagn > zeroMagn)
461 diagVals[i] += rowEntryMagn;
462 if (static_cast<size_t>(cols[j]) == i)
463 avgAbsDiagVal += rowEntryMagn;
465 if (nnzPerRow[i] == 1 && TST::magnitude(diagVals[i]) == 1.)
466 numDiagsEqualToOne++;
468 if (useAverageAbsDiagVal)
471 for (
size_t i = 0; i < rowMap->getLocalNumElements(); ++i) {
472 if (replaceSingleEntryRowWithZero && nnzPerRow[i] <= static_cast<int>(1))
474 else if ((diagVals[i] != zero) && (TST::magnitude(diagVals[i]) < TST::magnitude(two * regSum[i])))
475 diagVals[i] = one / TST::magnitude((two * regSum[i]));
477 if (TST::magnitude(diagVals[i]) > tol)
478 diagVals[i] = one / diagVals[i];
480 diagVals[i] = valReplacement;
488 "UtilitiesBase::GetLumpedMatrixDiagonal(): extracting reciprocal of diagonal of a blocked matrix is not supported");
// Blocked path: visit every non-null block and add its contribution (`dd`, computed on a
// line not visible here) into the range sub-vector belonging to that block row.
491 for (
size_t row = 0; row < bA->Rows(); ++row) {
492 for (
size_t col = 0; col < bA->Cols(); ++col) {
493 if (!bA->getMatrix(row, col).
is_null()) {
496 RCP<Vector> ddtemp = bA->getRangeMapExtractor()->ExtractVector(diag, row, bThyraMode);
// Called with both coefficients equal to 1, i.e. ddtemp and dd are combined with unit weights.
498 ddtemp->update(Teuchos::as<Scalar>(1.0), *dd, Teuchos::as<Scalar>(1.0));
499 bA->getRangeMapExtractor()->InsertVector(ddtemp, row, diag, bThyraMode);
// Row-wise pass over A that looks only at off-diagonal entries (signature, row-view
// extraction and the per-entry update are not visible in this excerpt).
508 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
512 size_t numRows = A.getRowMap()->getLocalNumElements();
517 for (
size_t i = 0; i < numRows; ++i) {
// Off-diagonal test: local column index differs from the local row index.
521 if (Teuchos::as<size_t>(cols[j]) != i) {
// Block-aware variant of the off-diagonal row pass (signature and per-entry update are
// not visible in this excerpt). Throws std::runtime_error unless BlockNumber's map is
// the same as A's column map.
530 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
534 TEUCHOS_TEST_FOR_EXCEPTION(!A.getColMap()->isSameAs(*BlockNumber.
getMap()), std::runtime_error,
"GetMatrixMaxMinusOffDiagonal: BlockNumber must match's A's column map.");
538 size_t numRows = A.getRowMap()->getLocalNumElements();
543 for (
size_t i = 0; i < numRows; ++i) {
// Only off-diagonal entries whose column carries the same block id as the row are considered.
547 if (Teuchos::as<size_t>(cols[j]) != i && block_id[i] == block_id[cols[j]]) {
// Element-wise processing of a vector with separate handling for blocked vectors
// (signature and the per-element computation are not visible in this excerpt).
558 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
// Blocked input: handle each sub-map separately and store the result in the blocked return vector.
566 if (bv.is_null() ==
false) {
570 for (
size_t r = 0; r < bmap->getNumMaps(); ++r) {
574 bret->setMultiVector(r, subvecinf, bmap->getThyraMode());
// Plain input: loop over local elements.
582 for (
size_t i = 0; i < v->getMap()->getLocalNumElements(); ++i) {
// NOTE(review): the condition under which the replacement value is written is not visible here.
586 retVals[i] = valReplacement;
// Builds a vector on the column map (`diagonal`) and, when no importer is available,
// creates one from the row map to the column map. The signature and the import call
// itself are not visible in this excerpt.
629 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
635 RCP<Vector> diagonal = VectorFactory::Build(colMap);
637 if (importer == Teuchos::null) {
638 importer = ImportFactory::Build(rowMap, colMap);
// Row-wise pass over A that treats off-diagonal entries specially, followed by an
// importer check (signature, accumulation and import lines are not visible here).
645 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
// For a blocked row map, use the map returned by browMap->getMap().
654 if (!browMap.
is_null()) rowMap = browMap->getMap();
660 for (
LO row = 0; row < static_cast<LO>(A.getRowMap()->getLocalNumElements()); ++row) {
668 for (
LO colID = 0; colID < static_cast<LO>(nnz); colID++) {
// Off-diagonal test: local column index differs from the local row index.
669 if (indices[colID] != row) {
678 if (importer == Teuchos::null) {
// For every local row, sums the magnitudes of the off-diagonal entries into `si` and
// stores the result in localVals[rowIdx]; an importer check follows. The signature,
// the initialisation of `si` and the import lines are not visible in this excerpt.
685 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
// For a blocked row map, use the map returned by browMap->getMap().
697 if (!browMap.
is_null()) rowMap = browMap->getMap();
703 for (
LO rowIdx = 0; rowIdx < static_cast<LO>(A.getRowMap()->getLocalNumElements()); ++rowIdx) {
711 for (
LO colID = 0; colID < static_cast<LO>(nnz); ++colID) {
// Skip the diagonal: only entries with column index != row index contribute.
712 if (indices[colID] != rowIdx) {
713 si += STS::magnitude(vals[colID]);
716 localVals[rowIdx] = si;
721 if (importer == Teuchos::null) {
// Only the template header and one statement are visible in this excerpt: the number
// of columns of the multivector X is read into numVecs.
728 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
733 const size_t numVecs = X.getNumVectors();
// Visible statements: read the number of columns of X, then fill the caller-supplied
// `Resid` by delegating to Residual(Op, X, RHS, Resid). The signature and whatever is
// done with the residual afterwards are not visible in this excerpt.
740 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
745 const size_t numVecs = X.getNumVectors();
746 Residual(Op, X, RHS, Resid);
// Visible statements: read the number of columns of X, then let the operator compute
// the residual into *RES via Op.residual(X, RHS, *RES). The signature and the
// allocation of RES are not visible in this excerpt.
752 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
757 const size_t numVecs = X.getNumVectors();
760 Op.residual(X, RHS, *RES);
// Visible statement: the operator computes the residual into the caller-supplied
// `Resid` via Op.residual(X, RHS, Resid). The signature is not visible in this excerpt.
764 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
769 Op.residual(X, RHS, Resid);
// Convenience front end for the power method (signature and the opening of the map
// check are not visible in this excerpt). Visible behaviour: an inverse-diagonal vector
// may be obtained from GetMatrixDiagonalInverse(A), and the work is delegated to the
// PowerMethod overload that takes that vector.
772 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
778 "Utils::PowerMethod: operator must have domain and range maps that are equivalent.");
// NOTE(review): the condition guarding this assignment is not visible here.
783 diagInvVec = GetMatrixDiagonalInverse(A);
786 Scalar lambda = PowerMethod(A, diagInvVec, niters, tolerance, verbose, seed);
// Power iteration on A, optionally scaled by an inverse-diagonal vector (rest of the
// signature, vector setup, the operator application and the lambda update are not
// visible in this excerpt). Per iteration the visible steps are: normalise the iterate,
// optionally scale z element-wise by diagInvVec, and periodically evaluate a relative
// residual that is printed and compared against `tolerance`.
790 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
793 PowerMethod(
const Matrix& A,
const RCP<Vector>& diagInvVec,
796 "Utils::PowerMethod: operator must have domain and range maps that are equivalent.");
810 const Scalar zero = STS::zero(), one = STS::one();
813 Magnitude
residual = STS::magnitude(zero);
816 for (
int iter = 0;
iter < niters; ++
iter) {
// q = z / norms[0]  (the zero coefficient discards q's previous contents).
818 q->update(one / norms[0], *z, zero);
// Optional diagonal scaling: z = diagInvVec .* z, applied only when a vector was supplied.
820 if (diagInvVec != Teuchos::null)
821 z->elementWiseMultiply(one, *diagInvVec, *z, zero);
// The residual is evaluated only every 100th iteration and on the final one.
824 if (iter % 100 == 0 || iter + 1 == niters) {
// r = z - lambda * q
825 r->update(1.0, *z, -lambda, *q, zero);
827 residual = STS::magnitude(norms[0] / lambda);
829 std::cout <<
"Iter = " <<
iter
830 <<
" Lambda = " << lambda
831 <<
" Residual of A*q - lambda*q = " << residual
// NOTE(review): the statement executed on convergence is not visible; presumably it leaves the loop.
835 if (residual < tolerance)
// Only the template header and the return type (an RCP to a Teuchos::FancyOStream) are
// visible in this excerpt; the function name, parameters and body are not.
841 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
842 RCP<Teuchos::FancyOStream>
// Accumulates into `d` the squared difference between entries i0 and i1 of every array
// in `v`, i.e. the sum over j of (v[j][i0] - v[j][i1])^2. The signature, the
// initialisation of `d` and the return are not visible in this excerpt.
849 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
853 const size_t numVectors = v.size();
856 for (
size_t j = 0; j < numVectors; j++) {
857 d += (v[j][i0] - v[j][i1]) * (v[j][i0] - v[j][i1]);
// Weighted variant: accumulates into `d` the sum over j of
// weight[j] * (v[j][i0] - v[j][i1])^2, with weight[j] converted to MT first.
// The signature, the initialisation of `d` and the return are not visible in this excerpt.
862 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
866 const size_t numVectors = v.size();
870 for (
size_t j = 0; j < numVectors; j++) {
871 d += Teuchos::as<MT>(weight[j]) * (v[j][i0] - v[j][i1]) * (v[j][i0] - v[j][i1]);
// Host-side detection of boundary rows; returns the `boundaryNodes` flags (signature,
// row loop headers and some branch lines are not visible in this excerpt). A row's flag
// is cleared when it has an off-diagonal entry with magnitude above `tol`; the
// count_twos_as_dirichlet branch uses a different rule built from the same test.
876 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
883 if (count_twos_as_dirichlet) {
891 for (col = 0; col < nnz; col++)
// Significant off-diagonal entry: column index differs from the row and |value| > tol.
892 if ((indices[col] != row) && STS::magnitude(vals[col]) > tol) {
// NOTE(review): the statement guarded by this check is not visible; the flag is toggled
// around it, presumably to tolerate one significant off-diagonal - confirm.
893 if (!boundaryNodes[row])
895 boundaryNodes[row] =
false;
898 boundaryNodes[row] =
true;
// Default rule: any significant off-diagonal entry clears the flag.
908 for (
size_t col = 0; col < nnz; col++)
909 if ((indices[col] != row) && STS::magnitude(vals[col]) > tol) {
910 boundaryNodes[row] =
false;
915 return boundaryNodes;
// Kokkos implementation of boundary-row detection, templated on the memory space of the
// returned View<bool*> (the function name line, some parameters and several branch
// lines are not visible in this excerpt). Flags are computed in a view living in
// NO::device_type::memory_space; if the requested memory_space is the same, that view
// is returned directly, otherwise it is deep-copied into a view in the requested space.
// Three kernels are visible: one for Tpetra BlockCrs storage and two for the regular
// local matrix (with and without count_twos_as_dirichlet).
918 template <
class SC,
class LO,
class GO,
class NO,
class memory_space>
919 Kokkos::View<bool*, memory_space>
922 const bool count_twos_as_dirichlet) {
923 using impl_scalar_type =
typename Kokkos::ArithTraits<SC>::val_type;
924 using ATS = Kokkos::ArithTraits<impl_scalar_type>;
925 using range_type = Kokkos::RangePolicy<LO, typename NO::execution_space>;
928 Kokkos::View<bool*, typename NO::device_type::memory_space> boundaryNodes;
// Block-CRS storage: work on block rows; values of one block are `stride` apart.
930 if (helpers::isTpetraBlockCrs(A)) {
932 auto b_graph = Am.getCrsGraph().getLocalGraphDevice();
933 auto b_rowptr = Am.getCrsGraph().getLocalRowPtrsDevice();
// Allocated without initialisation; every kernel below writes each row's flag first.
938 boundaryNodes = Kokkos::View<bool*, typename NO::device_type::memory_space>(Kokkos::ViewAllocateWithoutInitializing(
"boundaryNodes"), numBlockRows);
// NOTE(review): the statement executed for count_twos_as_dirichlet in the block case is not visible here.
940 if (count_twos_as_dirichlet)
943 Kokkos::parallel_for(
944 "MueLu:Utils::DetectDirichletRowsBlockCrs", range_type(0, numBlockRows),
945 KOKKOS_LAMBDA(
const LO row) {
946 auto rowView = b_graph.rowConst(row);
947 auto length = rowView.length;
// Offset of this block row's first value in the flat `values` array.
948 LO valstart = b_rowptr[row] * stride;
950 boundaryNodes(row) =
true;
951 decltype(length) colID = 0;
952 for (; colID < length; colID++) {
// Off-diagonal block: scan its `stride` values for any magnitude above tol.
953 if (rowView.colidx(colID) != row) {
954 LO current = valstart + colID * stride;
955 for (
LO k = 0; k < stride; k++) {
956 if (ATS::magnitude(values[current + k]) > tol) {
957 boundaryNodes(row) =
false;
962 if (boundaryNodes(row) ==
false)
// Regular (point) CRS storage.
967 auto localMatrix = A.getLocalMatrixDevice();
968 LO numRows = A.getLocalNumRows();
969 boundaryNodes = Kokkos::View<bool*, typename NO::device_type::memory_space>(Kokkos::ViewAllocateWithoutInitializing(
"boundaryNodes"), numRows);
971 if (count_twos_as_dirichlet)
972 Kokkos::parallel_for(
973 "MueLu:Utils::DetectDirichletRows_Twos_As_Dirichlet", range_type(0, numRows),
974 KOKKOS_LAMBDA(
const LO row) {
975 auto rowView = localMatrix.row(row);
976 auto length = rowView.length;
978 boundaryNodes(row) =
true;
980 decltype(length) colID = 0;
981 for (; colID < length; colID++)
982 if ((rowView.colidx(colID) != row) &&
983 (ATS::magnitude(rowView.value(colID)) > tol)) {
// NOTE(review): the statement guarded by this check is not visible; the flag is toggled
// around it, presumably to tolerate one significant off-diagonal - confirm.
984 if (!boundaryNodes(row))
986 boundaryNodes(row) =
false;
989 boundaryNodes(row) =
true;
// Default rule: a row stays flagged unless it has an off-diagonal entry with |value| > tol.
993 Kokkos::parallel_for(
994 "MueLu:Utils::DetectDirichletRows", range_type(0, numRows),
995 KOKKOS_LAMBDA(
const LO row) {
996 auto rowView = localMatrix.row(row);
997 auto length = rowView.length;
999 boundaryNodes(row) =
true;
1000 for (decltype(length) colID = 0; colID < length; colID++)
1001 if ((rowView.colidx(colID) != row) &&
1002 (ATS::magnitude(rowView.value(colID)) > tol)) {
1003 boundaryNodes(row) =
false;
// Same memory space requested: hand back the computed view without copying.
1008 if constexpr (std::is_same<memory_space, typename NO::device_type::memory_space>::value)
1009 return boundaryNodes;
// Different memory space requested: allocate there and deep_copy the flags across.
1011 Kokkos::View<bool*, memory_space> boundaryNodes2(Kokkos::ViewAllocateWithoutInitializing(
"boundaryNodes"), boundaryNodes.extent(0));
1012 Kokkos::deep_copy(boundaryNodes2, boundaryNodes);
1013 return boundaryNodes2;
// Zero-length placeholder view.
// NOTE(review): its use is not visible; presumably a fallback return to silence compiler warnings.
1016 Kokkos::View<bool*, memory_space> dummy(
"dummy", 0);
// Thin wrapper: forwards to MueLu::DetectDirichletRows_kokkos instantiated with the
// node's device memory space and returns its View<bool*> result. The function name line
// and the leading parameters are not visible in this excerpt.
1020 template <
class SC,
class LO,
class GO,
class NO>
1021 Kokkos::View<bool*, typename NO::device_type::memory_space>
1025 const bool count_twos_as_dirichlet) {
1026 return MueLu::DetectDirichletRows_kokkos<SC, LO, GO, NO, typename NO::device_type::memory_space>(A, tol, count_twos_as_dirichlet);
// Thin wrapper: forwards to MueLu::DetectDirichletRows_kokkos instantiated with
// Kokkos::HostSpace, so the returned flags live in host memory. The function name line
// and the leading parameters are not visible in this excerpt.
1029 template <
class SC,
class LO,
class GO,
class NO>
1030 Kokkos::View<bool*, typename Kokkos::HostSpace>
1034 const bool count_twos_as_dirichlet) {
1035 return MueLu::DetectDirichletRows_kokkos<SC, LO, GO, NO, typename Kokkos::HostSpace>(A, tol, count_twos_as_dirichlet);
// Boundary-row detection using diagonally scaled off-diagonal magnitudes, which also
// reports through `bHasZeroDiagonal` whether some row had no diagonal entry.
// The signature, row loop header and several branch lines are not visible in this excerpt.
1038 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1043 bHasZeroDiagonal =
false;
1057 bool bHasDiag =
false;
1058 for (decltype(indices.
size()) col = 0; col < indices.
size(); col++) {
1059 if (indices[col] != row) {
// Off-diagonal test: |a_ij| / sqrt(|d_row| * |d_*|) > tol.
// NOTE(review): the second factor is indexed with `col`, the position within the row,
// rather than indices[col], the local column id - confirm this is intended.
1060 if (STS::magnitude(vals[col] / STS::magnitude(sqrt(STS::magnitude(diagVecData[row]) * STS::magnitude(diagVecData[col])))) > tol) {
// A row in which no diagonal entry was seen sets the output flag.
1066 if (bHasDiag ==
false)
1067 bHasZeroDiagonal =
true;
1069 boundaryNodes[row] =
true;
1071 return boundaryNodes;
// Host loop over all entries of `vals` (signature and loop body are not visible in this
// excerpt).
1074 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1081 for (
size_t i = 0; i < static_cast<size_t>(vals.
size()); i++) {
// Kokkos kernel that sets nonzeros(i) to true exactly when |vals(i, 0)| exceeds
// 2 * machine epsilon of the implementation scalar type. The function name line and the
// first parameter are not visible in this excerpt.
1087 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1090 Kokkos::View<bool*, typename Node::device_type> nonzeros) {
1091 using ATS = Kokkos::ArithTraits<Scalar>;
1092 using impl_ATS = Kokkos::ArithTraits<typename ATS::val_type>;
1093 using range_type = Kokkos::RangePolicy<LocalOrdinal, typename Node::execution_space>;
// Threshold below which a value is treated as zero.
1095 const typename ATS::magnitudeType eps = 2.0 * impl_ATS::eps();
1097 Kokkos::parallel_for(
1098 "MueLu:Maxwell1::FindNonZeros", range_type(0, vals.extent(0)),
1099 KOKKOS_LAMBDA(
const size_t i) {
// Only column 0 of `vals` is inspected.
1100 nonzeros(i) = (impl_ATS::magnitude(vals(i, 0)) > eps);
// Marks the columns touched by Dirichlet rows and derives flags for both the column map
// and the domain map (signature, vector creation and branch headers are not visible in
// this excerpt). Visible flow: mark columns of flagged rows with `one` in myColsToZero,
// exchange through `importer` (export with ADD, then import with INSERT) or alias the two
// vectors, then convert both vectors to boolean flags with FindNonZeros.
1104 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
// The three flag arrays must match the local sizes of the row, column and domain maps.
1114 TEUCHOS_ASSERT(static_cast<size_t>(dirichletRows.
size()) == rowMap->getLocalNumElements());
1115 TEUCHOS_ASSERT(static_cast<size_t>(dirichletCols.
size()) == colMap->getLocalNumElements());
1116 TEUCHOS_ASSERT(static_cast<size_t>(dirichletDomain.
size()) == domMap->getLocalNumElements());
1119 for (
size_t i = 0; i < (size_t)dirichletRows.
size(); i++) {
1120 if (dirichletRows[i]) {
// Every column that appears in a Dirichlet row is marked with `one`.
1124 for (
size_t j = 0; j < static_cast<size_t>(indices.
size()); j++)
1125 myColsToZero->replaceLocalValue(indices[j], 0, one);
// Combine marks across processes (ADD), then bring the combined result back (INSERT).
1134 globalColsToZero->doExport(*myColsToZero, *importer,
Xpetra::ADD);
1136 myColsToZero->doImport(*globalColsToZero, *importer,
Xpetra::INSERT);
// NOTE(review): alternative path whose condition is not visible - presumably taken when there is no importer.
1138 globalColsToZero = myColsToZero;
1140 FindNonZeros(globalColsToZero->getData(0), dirichletDomain);
1141 FindNonZeros(myColsToZero->getData(0), dirichletCols);
// Kokkos-view variant of the Dirichlet column/domain detection (function name line,
// first parameter, lambda header and the final conversion to flags are not visible in
// this excerpt). Visible flow: a kernel marks every column appearing in a flagged row,
// then the marks are exchanged through `importer` (export with ADD, import with INSERT)
// or the two vectors are aliased.
1144 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1147 const Kokkos::View<bool*, typename Node::device_type>& dirichletRows,
1148 Kokkos::View<bool*, typename Node::device_type> dirichletCols,
1149 Kokkos::View<bool*, typename Node::device_type> dirichletDomain) {
1150 using ATS = Kokkos::ArithTraits<Scalar>;
1151 using impl_ATS = Kokkos::ArithTraits<typename ATS::val_type>;
1152 using range_type = Kokkos::RangePolicy<LocalOrdinal, typename Node::execution_space>;
// The three views must match the local sizes of the row, column and domain maps.
1156 TEUCHOS_ASSERT(dirichletRows.extent(0) == rowMap->getLocalNumElements());
1157 TEUCHOS_ASSERT(dirichletCols.extent(0) == colMap->getLocalNumElements());
1158 TEUCHOS_ASSERT(dirichletDomain.extent(0) == domMap->getLocalNumElements());
1161 auto myColsToZeroView = myColsToZero->getDeviceLocalView(Xpetra::Access::ReadWrite);
1162 auto localMatrix = A.getLocalMatrixDevice();
1163 Kokkos::parallel_for(
1164 "MueLu:Maxwell1::DetectDirichletCols", range_type(0, rowMap->getLocalNumElements()),
1166 if (dirichletRows(row)) {
1167 auto rowView = localMatrix.row(row);
1168 auto length = rowView.length;
// Different rows may mark the same column; every writer stores the same value (one).
1170 for (decltype(length) colID = 0; colID < length; colID++)
1171 myColsToZeroView(rowView.colidx(colID), 0) = impl_ATS::one();
1180 globalColsToZero->doExport(*myColsToZero, *importer,
Xpetra::ADD);
1182 myColsToZero->doImport(*globalColsToZero, *importer,
Xpetra::INSERT);
// NOTE(review): alternative path whose condition is not visible - presumably taken when there is no importer.
1184 globalColsToZero = myColsToZero;
// Flags rows as Dirichlet based on a row-sum test (signature, row-view extraction and
// the diagonal check are not visible in this excerpt). For each local row the entries
// are summed into `rowsum` and the diagonal value is captured in `diagval`; the row is
// flagged when rowSumTol < 1 and |rowsum| > |diagval| * rowSumTol.
1189 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1196 for (
LocalOrdinal row = 0; row < Teuchos::as<LocalOrdinal>(rowmap->getLocalNumElements()); ++row) {
1202 Scalar rowsum = STS::zero();
1203 Scalar diagval = STS::zero();
1205 for (
LocalOrdinal colID = 0; colID < Teuchos::as<LocalOrdinal>(nnz); colID++) {
// NOTE(review): the condition guarding the diagval assignment is not visible here.
1208 diagval = vals[colID];
1209 rowsum += vals[colID];
// A tolerance of one or more disables the criterion entirely.
1212 if (rowSumTol < MTS::one() && STS::magnitude(rowsum) > STS::magnitude(diagval) * rowSumTol) {
1214 dirichletRows[row] =
true;
// Block-aware row-sum criterion (signature, row-view extraction and the diagonal check
// are not visible in this excerpt). Same test as the plain variant, but only entries
// whose column has the same block id as the row contribute to `rowsum`.
// Throws std::runtime_error unless BlockNumber's map is the same as A's column map.
1219 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1225 RCP<const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>> rowmap = A.getRowMap();
1227 TEUCHOS_TEST_FOR_EXCEPTION(!A.getColMap()->isSameAs(*BlockNumber.
getMap()), std::runtime_error,
"ApplyRowSumCriterion: BlockNumber must match's A's column map.");
1230 for (
LocalOrdinal row = 0; row < Teuchos::as<LocalOrdinal>(rowmap->getLocalNumElements()); ++row) {
1232 ArrayView<const LocalOrdinal> indices;
1233 ArrayView<const Scalar> vals;
1236 Scalar rowsum = STS::zero();
1237 Scalar diagval = STS::zero();
1238 for (
LocalOrdinal colID = 0; colID < Teuchos::as<LocalOrdinal>(nnz); colID++) {
// NOTE(review): the definition of `col` and the condition guarding this assignment are not visible here.
1241 diagval = vals[colID];
// Only same-block entries enter the row sum.
1242 if (block_id[row] == block_id[col])
1243 rowsum += vals[colID];
// A tolerance of one or more disables the criterion entirely.
1247 if (rowSumTol < MTS::one() && STS::magnitude(rowsum) > STS::magnitude(diagval) * rowSumTol) {
1249 dirichletRows[row] =
true;
// Row-sum criterion operating on a Kokkos::View<bool*> in an arbitrary memory space
// (function name line, leading parameters and the diagonal check are not visible in
// this excerpt). The flags are mirrored to the host, updated in a host loop, and copied
// back. A row is flagged when real(rowsum) > |diagval| * rowSumTol.
1255 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node,
class memory_space>
1258 Kokkos::View<bool*, memory_space>& dirichletRows) {
// Work on a host mirror so the row loop can run on the host.
1262 auto dirichletRowsHost = Kokkos::create_mirror_view(dirichletRows);
1263 Kokkos::deep_copy(dirichletRowsHost, dirichletRows);
1265 for (
LocalOrdinal row = 0; row < Teuchos::as<LocalOrdinal>(rowmap->getLocalNumElements()); ++row) {
1271 Scalar rowsum = STS::zero();
1272 Scalar diagval = STS::zero();
1273 for (
LocalOrdinal colID = 0; colID < Teuchos::as<LocalOrdinal>(nnz); colID++) {
// NOTE(review): the condition guarding the diagval assignment is not visible here.
1276 diagval = vals[colID];
1277 rowsum += vals[colID];
// This variant compares the real part of the row sum; no `rowSumTol < 1` guard is visible here.
1279 if (STS::real(rowsum) > STS::magnitude(diagval) * rowSumTol)
1280 dirichletRowsHost(row) =
true;
// Publish the updated flags back to the caller's view.
1283 Kokkos::deep_copy(dirichletRows, dirichletRowsHost);
// Thin wrapper: forwards to MueLu::ApplyRowSumCriterion instantiated with the node's
// device memory space. The function name line and leading parameters are not visible.
1286 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1290 Kokkos::View<bool*, typename Node::device_type::memory_space>& dirichletRows) {
1291 MueLu::ApplyRowSumCriterion<Scalar, LocalOrdinal, GlobalOrdinal, Node, typename Node::device_type::memory_space>(A, rowSumTol, dirichletRows);
// Thin wrapper: forwards to MueLu::ApplyRowSumCriterion instantiated with
// Kokkos::HostSpace. The function name line and leading parameters are not visible.
1294 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1298 Kokkos::View<bool*, Kokkos::HostSpace>& dirichletRows) {
1299 MueLu::ApplyRowSumCriterion<Scalar, LocalOrdinal, GlobalOrdinal, Node, Kokkos::HostSpace>(A, rowSumTol, dirichletRows);
// Block-aware row-sum criterion operating on a Kokkos::View<bool*> in an arbitrary
// memory space (function name line, leading parameters and the diagonal check are not
// visible in this excerpt). Flags are mirrored to the host, updated there, and copied
// back; only entries whose column shares the row's block id enter the row sum.
// Throws std::runtime_error unless BlockNumber's map is the same as A's column map.
1303 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node,
class memory_space>
1307 Kokkos::View<bool*, memory_space>& dirichletRows) {
1311 TEUCHOS_TEST_FOR_EXCEPTION(!A.getColMap()->isSameAs(*BlockNumber.
getMap()), std::runtime_error,
"ApplyRowSumCriterion: BlockNumber must match's A's column map.");
// Work on a host mirror so the row loop can run on the host.
1313 auto dirichletRowsHost = Kokkos::create_mirror_view(dirichletRows);
1314 Kokkos::deep_copy(dirichletRowsHost, dirichletRows);
1317 for (
LocalOrdinal row = 0; row < Teuchos::as<LocalOrdinal>(rowmap->getLocalNumElements()); ++row) {
1323 Scalar rowsum = STS::zero();
1324 Scalar diagval = STS::zero();
1325 for (
LocalOrdinal colID = 0; colID < Teuchos::as<LocalOrdinal>(nnz); colID++) {
// NOTE(review): the definition of `col` and the condition guarding this assignment are not visible here.
1328 diagval = vals[colID];
1329 if (block_id[row] == block_id[col])
1330 rowsum += vals[colID];
// This variant compares the real part of the row sum; no `rowSumTol < 1` guard is visible here.
1332 if (STS::real(rowsum) > STS::magnitude(diagval) * rowSumTol)
1333 dirichletRowsHost(row) =
true;
// Publish the updated flags back to the caller's view.
1336 Kokkos::deep_copy(dirichletRows, dirichletRowsHost);
// Thin wrapper: forwards to the block-aware MueLu::ApplyRowSumCriterion instantiated
// with the node's device memory space. The function name line and leading parameters
// are not visible in this excerpt.
1339 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1344 Kokkos::View<bool*, typename Node::device_type::memory_space>& dirichletRows) {
1345 MueLu::ApplyRowSumCriterion<Scalar, LocalOrdinal, GlobalOrdinal, Node, typename Node::device_type::memory_space>(A, BlockNumber, rowSumTol, dirichletRows);
// Thin wrapper: forwards to the block-aware MueLu::ApplyRowSumCriterion instantiated
// with Kokkos::HostSpace. The function name line and leading parameters are not
// visible in this excerpt.
1348 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1353 Kokkos::View<bool*, Kokkos::HostSpace>& dirichletRows) {
1354 MueLu::ApplyRowSumCriterion<Scalar, LocalOrdinal, GlobalOrdinal, Node, Kokkos::HostSpace>(A, BlockNumber, rowSumTol, dirichletRows);
// Host-side detection of columns touched by Dirichlet rows; returns `dirichletCols`
// (signature, vector creation, branch headers and the final flag assignment are not
// visible in this excerpt). Visible flow: zero the marker vector, mark every column of
// each flagged row with `one`, exchange through `exporter` (export with ADD, import
// with INSERT), then loop over the local columns.
1357 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1367 myColsToZero->putScalar(zero);
1369 for (
size_t i = 0; i < (size_t)dirichletRows.
size(); i++) {
1370 if (dirichletRows[i]) {
1374 for (
size_t j = 0; j < static_cast<size_t>(indices.
size()); j++)
1375 myColsToZero->replaceLocalValue(indices[j], 0, one);
1380 globalColsToZero->putScalar(zero);
// Combine marks across processes (ADD), then bring the combined result back (INSERT).
1383 globalColsToZero->doExport(*myColsToZero, *exporter,
Xpetra::ADD);
1385 myColsToZero->doImport(*globalColsToZero, *exporter,
Xpetra::INSERT);
1389 for (
size_t i = 0; i < colMap->getLocalNumElements(); i++) {
1392 return dirichletCols;
// Kokkos variant of Dirichlet column detection; returns a View<bool*> with one flag per
// local column (function name line, first parameter and vector creation are not visible
// in this excerpt). Visible flow: zero the marker vector, mark columns of flagged rows
// in a kernel, exchange through `exporter` (export with ADD, import with INSERT), then
// flag every column whose marker magnitude exceeds 2 * ATS::eps().
1395 template <
class SC,
class LO,
class GO,
class NO>
1396 Kokkos::View<bool*, typename NO::device_type>
1399 const Kokkos::View<const bool*, typename NO::device_type>& dirichletRows) {
1400 using ATS = Kokkos::ArithTraits<SC>;
1401 using impl_ATS = Kokkos::ArithTraits<typename ATS::val_type>;
1402 using range_type = Kokkos::RangePolicy<LO, typename NO::execution_space>;
1404 SC zero = ATS::zero();
1406 auto localMatrix = A.getLocalMatrixDevice();
1407 LO numRows = A.getLocalNumRows();
1412 myColsToZero->putScalar(zero);
1413 auto myColsToZeroView = myColsToZero->getDeviceLocalView(Xpetra::Access::ReadWrite);
// Kernel 1: mark every column that appears in a flagged row.
1415 Kokkos::parallel_for(
1416 "MueLu:Utils::DetectDirichletCols1", range_type(0, numRows),
1417 KOKKOS_LAMBDA(
const LO row) {
1418 if (dirichletRows(row)) {
1419 auto rowView = localMatrix.row(row);
1420 auto length = rowView.length;
// Different rows may mark the same column; every writer stores the same value (one).
1422 for (decltype(length) colID = 0; colID < length; colID++)
1423 myColsToZeroView(rowView.colidx(colID), 0) = impl_ATS::one();
1428 globalColsToZero->putScalar(zero);
// Combine marks across processes (ADD), then bring the combined result back (INSERT).
1431 globalColsToZero->doExport(*myColsToZero, *exporter,
Xpetra::ADD);
1433 myColsToZero->doImport(*globalColsToZero, *exporter,
Xpetra::INSERT);
1435 auto myCols = myColsToZero->getDeviceLocalView(Xpetra::Access::ReadOnly);
1436 size_t numColEntries = colMap->getLocalNumElements();
// Allocated without initialisation; kernel 2 writes every element.
1437 Kokkos::View<bool*, typename NO::device_type> dirichletCols(Kokkos::ViewAllocateWithoutInitializing(
"dirichletCols"), numColEntries);
1438 const typename ATS::magnitudeType eps = 2.0 * ATS::eps();
// Kernel 2: convert markers to boolean flags.
1440 Kokkos::parallel_for(
1441 "MueLu:Utils::DetectDirichletCols2", range_type(0, numColEntries),
1442 KOKKOS_LAMBDA(
const size_t i) {
1443 dirichletCols(i) = impl_ATS::magnitude(myCols(i, 0)) > eps;
1445 return dirichletCols;
// Accumulates into `f` the sum of products of matching entries of A and B, row by row
// (signature, row-view extraction and the return are not visible in this excerpt).
// Technique: scatter row i of B into the dense scratch array valBAll, walk row i of A
// translating each column to B's local numbering, accumulate, then clear the scratch
// entries that were written.
1448 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1459 const Map& AColMap = *A.getColMap();
1460 const Map& BColMap = *B.getColMap();
1464 size_t nnzA = 0, nnzB = 0;
1480 size_t numRows = A.getLocalNumRows();
1481 for (
size_t i = 0; i < numRows; i++) {
// Scatter B's row into the dense scratch array, indexed by B's local column id.
1488 for (
size_t j = 0; j < nnzB; j++)
1489 valBAll[indB[j]] = valB[j];
1491 for (
size_t j = 0; j < nnzA; j++) {
// Map A's local column -> global id -> B's local column.
// NOTE(review): handling of columns absent from B's column map is on a line not visible here.
1494 LocalOrdinal ind = BColMap.getLocalElement(AColMap.getGlobalElement(indA[j]));
1496 f += valBAll[ind] * valA[j];
// Reset only the touched scratch entries so the next row starts from zeros.
1500 for (
size_t j = 0; j < nnzB; j++)
1501 valBAll[indB[j]] = zero;
// Derives a per-process integer seed from the communicator rank and size (signature and
// the use of the seed are not visible in this excerpt). The seed is
// (INT_MAX - 1) * (1 - (rank + 1) / (size + 1)), converted to int; an error message is
// composed when the result is below 1 or equal to INT_MAX.
1509 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1517 int maxint = INT_MAX;
// `one` is declared on a line not visible here.
// NOTE(review): if `one` were an integer type the division would truncate - confirm it is floating point.
1518 int mySeed = Teuchos::as<int>((maxint - 1) * (one - (comm.
getRank() + 1) / (comm.
getSize() + one)));
1519 if (mySeed < 1 || mySeed == maxint) {
1520 std::ostringstream errStr;
1521 errStr <<
"Error detected with random seed = " << mySeed <<
". It should be in the interval [1,2^31-2].";
// Collects into `dirichletRows` the local indices of rows whose counted entries number
// exactly one, or exactly two when count_twos_as_dirichlet is set. The signature, the
// row-view extraction and the counting rule inside the inner loop are not visible here.
1533 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1536 std::vector<LocalOrdinal>& dirichletRows,
bool count_twos_as_dirichlet) {
// Start from an empty result; any previous contents are discarded.
1538 dirichletRows.resize(0);
1539 for (
size_t i = 0; i < A->getLocalNumRows(); i++) {
1544 for (
size_t j = 0; j < (size_t)indices.
size(); j++) {
1549 if (nnz == 1 || (count_twos_as_dirichlet && nnz == 2)) {
1550 dirichletRows.push_back(i);
// Visits each row listed in `dirichletRows` and, within it, locates the entry whose
// global column id equals the row's global id (signature, row-view extraction and the
// values written are not visible in this excerpt).
1555 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1558 const std::vector<LocalOrdinal>& dirichletRows) {
1564 for (
size_t i = 0; i < dirichletRows.size(); i++) {
1565 GlobalOrdinal row_gid = Rmap->getGlobalElement(dirichletRows[i]);
1572 for (
size_t j = 0; j < (size_t)indices.
size(); j++) {
// Diagonal test done in global ids, since row and column maps may number locally in different ways.
1573 if (Cmap->getGlobalElement(indices[j]) == row_gid)
// Flag-array variant: visits each row whose entry in `dirichletRows` is true and locates
// the entry whose global column id equals the row's global id (signature, row-view
// extraction and the values written are not visible in this excerpt).
1581 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
// One flag per local row is required.
1590 TEUCHOS_ASSERT(static_cast<size_t>(dirichletRows.
size()) == Rmap->getLocalNumElements());
1594 for (
size_t i = 0; i < (size_t)dirichletRows.
size(); i++) {
1595 if (dirichletRows[i]) {
1603 for (
size_t j = 0; j < (size_t)indices.
size(); j++) {
// Diagonal test done in global ids.
1604 if (Cmap->getGlobalElement(indices[j]) == row_gid)
// Kokkos variant: for every flagged row, overwrites the stored values so that the
// diagonal entry becomes one and all other entries become zero. The function name line,
// first parameter and lambda header are not visible in this excerpt.
1615 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1618 const Kokkos::View<const bool*, typename Node::device_type>& dirichletRows) {
1620 using ATS = Kokkos::ArithTraits<Scalar>;
1621 using impl_ATS = Kokkos::ArithTraits<typename ATS::val_type>;
1622 using range_type = Kokkos::RangePolicy<LocalOrdinal, typename Node::execution_space>;
// One flag per local row is required.
1629 TEUCHOS_ASSERT(static_cast<size_t>(dirichletRows.size()) == Rmap->getLocalNumElements());
1631 auto localMatrix = A->getLocalMatrixDevice();
// Local map objects obtained from the row and column maps; used inside the kernel below.
1632 auto localRmap = Rmap->getLocalMap();
1633 auto localCmap = Cmap->getLocalMap();
1635 Kokkos::parallel_for(
1636 "MueLu::Utils::ApplyOAZ", range_type(0, dirichletRows.extent(0)),
1638 if (dirichletRows(row)) {
1639 auto rowView = localMatrix.row(row);
1640 auto length = rowView.length;
// Translate row -> global id -> local column id to find the diagonal's column index.
1641 auto row_gid = localRmap.getGlobalElement(row);
1642 auto row_lid = localCmap.getLocalElement(row_gid);
1644 for (decltype(length) colID = 0; colID < length; colID++)
1645 if (rowView.colidx(colID) == row_lid)
1646 rowView.value(colID) = impl_ATS::one();
1648 rowView.value(colID) = impl_ATS::zero();
1653 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1656 const std::vector<LocalOrdinal>& dirichletRows,
1658 for (
size_t i = 0; i < dirichletRows.size(); i++) {
1664 for (
size_t j = 0; j < (size_t)indices.
size(); j++)
1665 valuesNC[j] = replaceWith;
1669 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1674 TEUCHOS_ASSERT(static_cast<size_t>(dirichletRows.
size()) == A->getRowMap()->getLocalNumElements());
1675 for (
size_t i = 0; i < (size_t)dirichletRows.
size(); i++) {
1676 if (dirichletRows[i]) {
1682 for (
size_t j = 0; j < (size_t)indices.
size(); j++)
1683 valuesNC[j] = replaceWith;
1688 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1693 TEUCHOS_ASSERT(static_cast<size_t>(dirichletRows.
size()) == X->getMap()->getLocalNumElements());
1694 for (
size_t i = 0; i < (size_t)dirichletRows.
size(); i++) {
1695 if (dirichletRows[i]) {
1696 for (
size_t j = 0; j < X->getNumVectors(); j++)
1697 X->replaceLocalValue(i, j, replaceWith);
1702 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1705 const Kokkos::View<const bool*, typename Node::device_type>& dirichletRows,
1707 using ATS = Kokkos::ArithTraits<Scalar>;
1708 using range_type = Kokkos::RangePolicy<LocalOrdinal, typename Node::execution_space>;
1710 typename ATS::val_type impl_replaceWith = replaceWith;
1712 auto localMatrix = A->getLocalMatrixDevice();
1715 Kokkos::parallel_for(
1716 "MueLu:Utils::ZeroDirichletRows", range_type(0, numRows),
1718 if (dirichletRows(row)) {
1719 auto rowView = localMatrix.row(row);
1720 auto length = rowView.length;
1721 for (decltype(length) colID = 0; colID < length; colID++)
1722 rowView.value(colID) = impl_replaceWith;
1727 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1730 const Kokkos::View<const bool*, typename Node::device_type>& dirichletRows,
1732 using ATS = Kokkos::ArithTraits<Scalar>;
1733 using range_type = Kokkos::RangePolicy<LocalOrdinal, typename Node::execution_space>;
1735 typename ATS::val_type impl_replaceWith = replaceWith;
1737 auto myCols = X->getDeviceLocalView(Xpetra::Access::ReadWrite);
1738 size_t numVecs = X->getNumVectors();
1739 Kokkos::parallel_for(
1740 "MueLu:Utils::ZeroDirichletRows_MV", range_type(0, dirichletRows.size()),
1741 KOKKOS_LAMBDA(
const size_t i) {
1742 if (dirichletRows(i)) {
1743 for (
size_t j = 0; j < numVecs; j++)
1744 myCols(i, j) = impl_replaceWith;
1749 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1754 TEUCHOS_ASSERT(static_cast<size_t>(dirichletCols.
size()) == A->getColMap()->getLocalNumElements());
1755 for (
size_t i = 0; i < A->getLocalNumRows(); i++) {
1758 A->getLocalRowView(i, indices, values);
1761 for (
size_t j = 0; j < static_cast<size_t>(indices.
size()); j++)
1762 if (dirichletCols[indices[j]])
1763 valuesNC[j] = replaceWith;
1767 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1770 const Kokkos::View<const bool*, typename Node::device_type>& dirichletCols,
1772 using ATS = Kokkos::ArithTraits<Scalar>;
1773 using range_type = Kokkos::RangePolicy<LocalOrdinal, typename Node::execution_space>;
1775 typename ATS::val_type impl_replaceWith = replaceWith;
1777 auto localMatrix = A->getLocalMatrixDevice();
1780 Kokkos::parallel_for(
1781 "MueLu:Utils::ZeroDirichletCols", range_type(0, numRows),
1783 auto rowView = localMatrix.row(row);
1784 auto length = rowView.length;
1785 for (decltype(length) colID = 0; colID < length; colID++)
1786 if (dirichletCols(rowView.colidx(colID))) {
1787 rowView.value(colID) = impl_replaceWith;
1792 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1799 throw std::runtime_error(
"UtilitiesBase::FindDirichletRowsAndPropagateToCols row and domain maps must match.");
1802 bool has_import = !importer.
is_null();
1805 std::vector<LocalOrdinal> dirichletRows;
1806 FindDirichletRows(A, dirichletRows);
1809 printf(
"[%d] DirichletRow Ids = ",A->getRowMap()->getComm()->getRank());
1810 for(
size_t i=0; i<(size_t) dirichletRows.size(); i++)
1811 printf(
"%d ",dirichletRows[i]);
1824 for (
size_t i = 0; i < (size_t)dirichletRows.size(); i++) {
1825 dr[dirichletRows[i]] = 1;
1826 if (!has_import) dc[dirichletRows[i]] = 1;
1831 isDirichletCol->doImport(*isDirichletRow, *importer, Xpetra::CombineMode::ADD);
1834 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1838 using ISC =
typename Kokkos::ArithTraits<Scalar>::val_type;
1839 using range_type = Kokkos::RangePolicy<LocalOrdinal, typename Node::execution_space>;
1840 using local_matrix_type =
typename CrsMatrix::local_matrix_type;
1841 using values_type =
typename local_matrix_type::values_type;
1843 const ISC ONE = Kokkos::ArithTraits<ISC>::one();
1844 const ISC
ZERO = Kokkos::ArithTraits<ISC>::zero();
1847 auto localMatrix = original->getLocalMatrixDevice();
1849 values_type new_values(
"values", localMatrix.nnz());
1851 Kokkos::parallel_for(
1852 "ReplaceNonZerosWithOnes", range_type(0, localMatrix.nnz()), KOKKOS_LAMBDA(
const size_t i) {
1853 if (localMatrix.values(i) != ZERO)
1854 new_values(i) = ONE;
1856 new_values(i) = ZERO;
1862 NewMatrix->fillComplete(original->getDomainMap(), original->getRangeMap());
1866 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1877 if (!stridedMap.
is_null()) fullMap = stridedMap->getMap();
1880 const size_t numSubMaps = sourceBlockedMap.
getNumMaps();
1882 throw std::runtime_error(
"GenerateBlockedTargetMap(): Map compatibility error");
1887 for (
size_t i = 0; i < numSubMaps; i++) {
1890 for (
size_t j = 0; j < map->getLocalNumElements(); j++) {
1891 LocalOrdinal jj = fullMap->getLocalElement(map->getGlobalElement(j));
1892 block_ids->replaceLocalValue(jj, (
int)i);
1899 new_block_ids->doImport(*block_ids, Importer, Xpetra::CombineMode::ADD);
1905 for (
size_t i = 0; i < targetMap->getLocalNumElements(); i++) {
1906 elementsInSubMap[data[i]].
push_back(targetMap->getGlobalElement(i));
1910 std::vector<RCP<const Map>> subMaps(numSubMaps);
1911 for (
size_t i = 0; i < numSubMaps; i++) {
1916 return rcp(
new BlockedMap(targetMap, subMaps));
1919 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1925 const size_t numElements = rowElements.
size();
1927 if (
size_t(colElements.
size()) < numElements)
1930 bool goodMap =
true;
1931 for (
size_t i = 0; i < numElements; i++)
1932 if (rowElements[i] != colElements[i]) {
1940 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1945 using local_graph_type =
typename local_matrix_type::staticcrsgraph_type;
1946 using lno_nnz_view_t =
typename local_graph_type::entries_type::non_const_type;
1947 using device =
typename local_graph_type::device_type;
1948 using execution_space =
typename local_matrix_type::execution_space;
1949 using ordinal_type =
typename local_matrix_type::ordinal_type;
1951 local_graph_type localGraph = Op.getLocalMatrixDevice().graph;
1953 lno_nnz_view_t rcmOrder = KokkosGraph::Experimental::graph_rcm<device, typename local_graph_type::row_map_type, typename local_graph_type::entries_type, lno_nnz_view_t>(localGraph.row_map, localGraph.entries);
1959 auto view1D = Kokkos::subview(retval->getDeviceLocalView(Xpetra::Access::ReadWrite), Kokkos::ALL(), 0);
1960 Kokkos::parallel_for(
1961 "Utilities::ReverseCuthillMcKee",
1962 Kokkos::RangePolicy<ordinal_type, execution_space>(0, localGraph.numRows()),
1963 KOKKOS_LAMBDA(
const ordinal_type rowIdx) {
1964 view1D(rcmOrder(rowIdx)) = rowIdx;
1969 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1974 using local_graph_type =
typename local_matrix_type::staticcrsgraph_type;
1975 using lno_nnz_view_t =
typename local_graph_type::entries_type::non_const_type;
1976 using device =
typename local_graph_type::device_type;
1977 using execution_space =
typename local_matrix_type::execution_space;
1978 using ordinal_type =
typename local_matrix_type::ordinal_type;
1980 local_graph_type localGraph = Op.getLocalMatrixDevice().graph;
1983 lno_nnz_view_t rcmOrder = KokkosGraph::Experimental::graph_rcm<device, typename local_graph_type::row_map_type, typename local_graph_type::entries_type, lno_nnz_view_t>(localGraph.row_map, localGraph.entries);
1989 auto view1D = Kokkos::subview(retval->getDeviceLocalView(Xpetra::Access::ReadWrite), Kokkos::ALL(), 0);
1991 Kokkos::parallel_for(
1992 "Utilities::ReverseCuthillMcKee",
1993 Kokkos::RangePolicy<ordinal_type, execution_space>(0, numRows),
1994 KOKKOS_LAMBDA(
const ordinal_type rowIdx) {
1995 view1D(rcmOrder(numRows - 1 - rowIdx)) = rowIdx;
2002 #define MUELU_UTILITIESBASE_SHORT
2003 #endif // MUELU_UTILITIESBASE_DEF_HPP
static void FindNonZeros(const Teuchos::ArrayRCP< const Scalar > vals, Teuchos::ArrayRCP< bool > nonzeros)
Find non-zero values in an ArrayRCP. Compares the value to 2 * machine epsilon.
static RCP< Export< LocalOrdinal, GlobalOrdinal, Node > > Build(const RCP< const Map< LocalOrdinal, GlobalOrdinal, Node > > &source, const RCP< const Map< LocalOrdinal, GlobalOrdinal, Node > > &target)
static RCP< Vector > GetMatrixDiagonal(const Matrix &A)
Extract Matrix Diagonal.
static void ApplyOAZToMatrixRows(Teuchos::RCP< Xpetra::Matrix< Scalar, LocalOrdinal, GlobalOrdinal, Node >> &A, const std::vector< LocalOrdinal > &dirichletRows)
static void ZeroDirichletCols(Teuchos::RCP< Matrix > &A, const Teuchos::ArrayRCP< const bool > &dirichletCols, Scalar replaceWith=Teuchos::ScalarTraits< Scalar >::zero())
static void DetectDirichletColsAndDomains(const Xpetra::Matrix< Scalar, LocalOrdinal, GlobalOrdinal, Node > &A, const Teuchos::ArrayRCP< bool > &dirichletRows, Teuchos::ArrayRCP< bool > dirichletCols, Teuchos::ArrayRCP< bool > dirichletDomain)
Detects Dirichlet columns & domains from a list of Dirichlet rows.
#define MueLu_sumAll(rcpComm, in, out)
static RCP< CrsMatrixWrap > GetThresholdedMatrix(const RCP< Matrix > &Ain, const Scalar threshold, const bool keepDiagonal=true, const GlobalOrdinal expectedNNZperRow=-1)
Threshold a matrix.
Array< T > & append(const T &x)
virtual int getSize() const =0
MueLu::DefaultLocalOrdinal LocalOrdinal
void ApplyRowSumCriterion(const Xpetra::Matrix< Scalar, LocalOrdinal, GlobalOrdinal, Node > &A, const typename Teuchos::ScalarTraits< Scalar >::magnitudeType rowSumTol, Kokkos::View< bool *, memory_space > &dirichletRows)
virtual LO getBlockSize() const override
static bool MapsAreNested(const Xpetra::Map< LocalOrdinal, GlobalOrdinal, Node > &rowMap, const Xpetra::Map< LocalOrdinal, GlobalOrdinal, Node > &colMap)
static RCP< Xpetra::Vector< LocalOrdinal, LocalOrdinal, GlobalOrdinal, Node > > ReverseCuthillMcKee(const Matrix &Op)
static void FindDirichletRowsAndPropagateToCols(Teuchos::RCP< Xpetra::Matrix< Scalar, LocalOrdinal, GlobalOrdinal, Node >> &A, Teuchos::RCP< Xpetra::Vector< int, LocalOrdinal, GlobalOrdinal, Node >> &isDirichletRow, Teuchos::RCP< Xpetra::Vector< int, LocalOrdinal, GlobalOrdinal, Node >> &isDirichletCol)
virtual int getRank() const =0
static void ApplyRowSumCriterionHost(const Matrix &A, const typename Teuchos::ScalarTraits< Scalar >::magnitudeType rowSumTol, Kokkos::View< bool *, Kokkos::HostSpace > &dirichletRows)
static Teuchos::RCP< MultiVector< Scalar, LocalOrdinal, GlobalOrdinal, Node > > Build(const Teuchos::RCP< const Map< LocalOrdinal, GlobalOrdinal, Node >> &map, size_t NumVectors, bool zeroOut=true)
static magnitudeType eps()
static Scalar PowerMethod(const Matrix &A, bool scaleByDiag=true, LocalOrdinal niters=10, Magnitude tolerance=1e-2, bool verbose=false, unsigned int seed=123)
Power method.
static void ApplyRowSumCriterion(const Xpetra::Matrix< Scalar, LocalOrdinal, GlobalOrdinal, Node > &A, const Magnitude rowSumTol, Teuchos::ArrayRCP< bool > &dirichletRows)
Apply Rowsum Criterion.
#define TEUCHOS_TEST_FOR_EXCEPTION(throw_exception_test, Exception, msg)
static RCP< Vector > GetMatrixOverlappedDeletedRowsum(const Matrix &A)
Extract Overlapped Matrix Deleted Rowsum.
static RCP< Xpetra::CrsGraph< LocalOrdinal, GlobalOrdinal, Node > > GetThresholdedGraph(const RCP< Matrix > &A, const Magnitude threshold, const GlobalOrdinal expectedNNZperRow=-1)
Threshold a graph.
virtual void resumeFill(const RCP< ParameterList > &params=null)=0
static void ZeroDirichletRows(Teuchos::RCP< Xpetra::Matrix< Scalar, LocalOrdinal, GlobalOrdinal, Node >> &A, const std::vector< LocalOrdinal > &dirichletRows, Scalar replaceWith=Teuchos::ScalarTraits< Scalar >::zero())
static RCP< Xpetra::Matrix< Scalar, LocalOrdinal, GlobalOrdinal, Node > > ReplaceNonZerosWithOnes(const RCP< Matrix > &original)
Creates a copy of a matrix where the non-zero entries are replaced by ones.
size_t getLocalNumRows() const override
Exception thrown to report incompatible objects (like maps).
static void SetRandomSeed(const Teuchos::Comm< int > &comm)
Set seed for random number generator.
static RCP< Xpetra::Vector< LocalOrdinal, LocalOrdinal, GlobalOrdinal, Node > > CuthillMcKee(const Matrix &Op)
static Teuchos::ArrayRCP< Magnitude > GetMatrixMaxMinusOffDiagonal(const Xpetra::Matrix< Scalar, LocalOrdinal, GlobalOrdinal, Node > &A)
Return vector containing: max_{k \neq i}(-a_{ik}), for each row i in the matrix.
virtual Teuchos::RCP< const Map< LocalOrdinal, GlobalOrdinal, Node > > getTargetMap() const =0
static RCP< Time > getNewTimer(const std::string &name)
void resize(const size_type n, const T &val=T())
virtual void fillComplete(const RCP< const Map > &domainMap, const RCP< const Map > &rangeMap, const RCP< ParameterList > &params=null)=0
virtual void getLocalDiagCopy(Vector< Scalar, LocalOrdinal, GlobalOrdinal, Node > &diag) const =0
static RCP< MultiVector > Residual(const Xpetra::Operator< Scalar, LocalOrdinal, GlobalOrdinal, Node > &Op, const MultiVector &X, const MultiVector &RHS)
static Teuchos::ArrayRCP< const bool > DetectDirichletCols(const Xpetra::Matrix< Scalar, LocalOrdinal, GlobalOrdinal, Node > &A, const Teuchos::ArrayRCP< const bool > &dirichletRows)
Detect Dirichlet columns based on Dirichlet rows.
virtual void getLocalRowView(LocalOrdinal LocalRow, ArrayView< const LocalOrdinal > &indices, ArrayView< const Scalar > &values) const =0
static void FindDirichletRows(Teuchos::RCP< Xpetra::Matrix< Scalar, LocalOrdinal, GlobalOrdinal, Node >> &A, std::vector< LocalOrdinal > &dirichletRows, bool count_twos_as_dirichlet=false)
TEUCHOS_DEPRECATED RCP< T > rcp(T *p, Dealloc_T dealloc, bool owns_mem)
MueLu::DefaultScalar Scalar
Kokkos::View< bool *, memory_space > DetectDirichletRows_kokkos(const Xpetra::Matrix< SC, LO, GO, NO > &A, const typename Teuchos::ScalarTraits< SC >::magnitudeType &tol, const bool count_twos_as_dirichlet)
MueLu::DefaultGlobalOrdinal GlobalOrdinal
static Teuchos::RCP< Map< LocalOrdinal, GlobalOrdinal, Node > > Build(UnderlyingLib lib, global_size_t numGlobalElements, GlobalOrdinal indexBase, const Teuchos::RCP< const Teuchos::Comm< int >> &comm, LocalGlobal lg=Xpetra::GloballyDistributed)
static Teuchos::ArrayRCP< const bool > DetectDirichletRows(const Xpetra::Matrix< Scalar, LocalOrdinal, GlobalOrdinal, Node > &A, const Magnitude &tol=Teuchos::ScalarTraits< Magnitude >::zero(), bool count_twos_as_dirichlet=false)
Detect Dirichlet rows.
virtual bool isFillComplete() const =0
static RCP< Xpetra::Vector< Magnitude, LocalOrdinal, GlobalOrdinal, Node > > GetMatrixOverlappedAbsDeletedRowsum(const Matrix &A)
size_t getNumMaps() const
virtual void replaceLocalValues(LocalOrdinal localRow, const ArrayView< const LocalOrdinal > &cols, const ArrayView< const Scalar > &vals)=0
static Teuchos::ArrayRCP< Scalar > GetMatrixDiagonal_arcp(const Matrix &A)
Extract Matrix Diagonal.
virtual Teuchos::RCP< const Map< LocalOrdinal, GlobalOrdinal, Node > > getMap() const =0
static RCP< const Xpetra::BlockedMap< LocalOrdinal, GlobalOrdinal, Node > > GeneratedBlockedTargetMap(const Xpetra::BlockedMap< LocalOrdinal, GlobalOrdinal, Node > &sourceBlockedMap, const Xpetra::Import< LocalOrdinal, GlobalOrdinal, Node > &Importer)
static RCP< Vector > GetMatrixOverlappedDiagonal(const Matrix &A)
Extract Overlapped Matrix Diagonal.
Teuchos::ScalarTraits< Scalar >::magnitudeType Magnitude
virtual size_t getNumEntriesInLocalRow(LocalOrdinal localRow) const =0
static RCP< Vector > GetMatrixDiagonalInverse(const Matrix &A, Magnitude tol=Teuchos::ScalarTraits< Scalar >::eps()*100, Scalar valReplacement=Teuchos::ScalarTraits< Scalar >::zero(), const bool doLumped=false)
Extract Matrix Diagonal.
static void seedrandom(unsigned int s)
static Teuchos::ArrayRCP< const bool > DetectDirichletRowsExt(const Xpetra::Matrix< Scalar, LocalOrdinal, GlobalOrdinal, Node > &A, bool &bHasZeroDiagonal, const Magnitude &tol=Teuchos::ScalarTraits< Scalar >::zero())
Detect Dirichlet rows (extended version)
static RCP< Vector > Build(const Teuchos::RCP< const Map > &map, bool zeroOut=true)
const RCP< const Xpetra::Map< LocalOrdinal, GlobalOrdinal, Node > > getMap(size_t i, bool bThyraMode=false) const
virtual UnderlyingLib lib() const
static magnitudeType magnitude(T a)
void push_back(const value_type &x)
virtual RCP< const CrsGraph > getCrsGraph() const =0
static Teuchos::Array< Magnitude > ResidualNorm(const Xpetra::Operator< Scalar, LocalOrdinal, GlobalOrdinal, Node > &Op, const MultiVector &X, const MultiVector &RHS)
impl_scalar_type_dualview::t_dev::const_type getValuesDevice(const LO &lclRow) const
virtual Teuchos::RCP< const Map > getRangeMap() const =0
static RCP< Teuchos::FancyOStream > MakeFancy(std::ostream &os)
static RCP< Matrix > Build(const RCP< const Map > &rowMap, size_t maxNumEntriesPerRow, Xpetra::ProfileType pftype=Xpetra::DynamicProfile)
void residual(const Operator< SC, LO, GO, NO > &Aop, const MultiVector< SC, LO, GO, NO > &X_in, const MultiVector< SC, LO, GO, NO > &B_in, MultiVector< SC, LO, GO, NO > &R_in)
Exception thrown to report errors in the internal logic of the program.
static Scalar Frobenius(const Xpetra::Matrix< Scalar, LocalOrdinal, GlobalOrdinal, Node > &A, const Xpetra::Matrix< Scalar, LocalOrdinal, GlobalOrdinal, Node > &B)
Frobenius inner product of two matrices.
virtual Teuchos::RCP< const Map< LocalOrdinal, GlobalOrdinal, Node > > getSourceMap() const =0
#define TEUCHOS_ASSERT(assertion_test)
static Teuchos::RCP< Vector > GetInverse(Teuchos::RCP< const Vector > v, Magnitude tol=Teuchos::ScalarTraits< Scalar >::eps()*100, Scalar valReplacement=Teuchos::ScalarTraits< Scalar >::zero())
Return vector containing inverse of input vector.
static Kokkos::View< bool *, typename Kokkos::HostSpace > DetectDirichletRows_kokkos_host(const Matrix &A, const Magnitude &tol=Teuchos::ScalarTraits< typename Teuchos::ScalarTraits< SC >::magnitudeType >::zero(), const bool count_twos_as_dirichlet=false)
static Teuchos::ScalarTraits< Scalar >::magnitudeType Distance2(const Teuchos::Array< Teuchos::ArrayRCP< const Scalar >> &v, LocalOrdinal i0, LocalOrdinal i1)
Squared distance between two rows in a multivector.
static Teuchos::RCP< Vector > GetLumpedMatrixDiagonal(Matrix const &A, const bool doReciprocal=false, Magnitude tol=Teuchos::ScalarTraits< Scalar >::magnitude(Teuchos::ScalarTraits< Scalar >::zero()), Scalar valReplacement=Teuchos::ScalarTraits< Scalar >::zero(), const bool replaceSingleEntryRowWithZero=false, const bool useAverageAbsDiagVal=false)
Extract Matrix Diagonal of lumped matrix.
static Kokkos::View< bool *, typename NO::device_type::memory_space > DetectDirichletRows_kokkos(const Matrix &A, const Magnitude &tol=Teuchos::ScalarTraits< typename Teuchos::ScalarTraits< SC >::magnitudeType >::zero(), const bool count_twos_as_dirichlet=false)
Detect Dirichlet rows.
static RCP< Matrix > Crs2Op(RCP< CrsMatrix > Op)
virtual Teuchos::ArrayRCP< const Scalar > getData(size_t j) const =0
virtual Teuchos::RCP< const Map > getDomainMap() const =0
static RCP< Import< LocalOrdinal, GlobalOrdinal, Node > > Build(const RCP< const Map< LocalOrdinal, GlobalOrdinal, Node > > &source, const RCP< const Map< LocalOrdinal, GlobalOrdinal, Node > > &target, const Teuchos::RCP< Teuchos::ParameterList > &plist=Teuchos::null)