46 #ifndef MUELU_RAPFACTORY_DEF_HPP
47 #define MUELU_RAPFACTORY_DEF_HPP
64 #include "MueLu_PerfUtils.hpp"
70 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
72 : hasDeclaredInput_(false) { }
74 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
78 #define SET_VALID_ENTRY(name) validParamList->setEntry(name, MasterList::getEntry(name))
83 #undef SET_VALID_ENTRY
84 validParamList->
set<
RCP<const FactoryBase> >(
"A", null,
"Generating factory of the matrix A used during the prolongator smoothing process");
88 validParamList->
set<
bool > (
"CheckMainDiagonal",
false,
"Check main diagonal for zeros");
89 validParamList->
set<
bool > (
"RepairMainDiagonal",
false,
"Repair zeros on main diagonal");
94 validParamList->
set<
ParameterList> (
"matrixmatrix: kernel params", norecurse,
"MatrixMatrix kernel parameters");
96 return validParamList;
99 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
102 if (pL.
get<
bool>(
"transpose: use implicit") ==
false)
103 Input(coarseLevel,
"R");
105 Input(fineLevel,
"A");
106 Input(coarseLevel,
"P");
109 for (std::vector<
RCP<const FactoryBase> >::const_iterator it = transferFacts_.begin(); it != transferFacts_.end(); ++it)
110 (*it)->CallDeclareInput(coarseLevel);
112 hasDeclaredInput_ =
true;
115 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
117 const bool doTranspose =
true;
118 const bool doFillComplete =
true;
119 const bool doOptimizeStorage =
true;
122 std::ostringstream levelstr;
127 "MueLu::RAPFactory::Build(): CallDeclareInput has not been called before Build!");
130 RCP<Matrix> A = Get< RCP<Matrix> >(fineLevel,
"A");
131 RCP<Matrix> P = Get< RCP<Matrix> >(coarseLevel,
"P"), AP, Ac;
134 #ifdef KOKKOS_ENABLE_CUDA
135 bool isCuda =
typeid(
Node).name() ==
typeid(Kokkos::Compat::KokkosCudaWrapperNode).name();
140 if (pL.
get<
bool>(
"rap: triple product") ==
false || isEpetra || isCuda) {
141 if (pL.
get<
bool>(
"rap: triple product") && isEpetra)
142 GetOStream(
Warnings1) <<
"Switching from triple product to R x (A x P) since triple product has not been implemented for Epetra.\n";
143 #ifdef KOKKOS_ENABLE_CUDA
144 if (pL.
get<
bool>(
"rap: triple product") && isCuda)
145 GetOStream(
Warnings1) <<
"Switching from triple product to R x (A x P) since triple product has not been implemented for Cuda.\n";
150 if(pL.
isSublist(
"matrixmatrix: kernel params"))
151 APparams->
sublist(
"matrixmatrix: kernel params") = pL.
sublist(
"matrixmatrix: kernel params");
154 APparams->
set(
"compute global constants: temporaries",APparams->
get(
"compute global constants: temporaries",
false));
155 APparams->
set(
"compute global constants",APparams->
get(
"compute global constants",
false));
157 if (coarseLevel.IsAvailable(
"AP reuse data",
this)) {
158 GetOStream(static_cast<MsgType>(
Runtime0 |
Test)) <<
"Reusing previous AP data" << std::endl;
169 AP = MatrixMatrix::Multiply(*A, !doTranspose, *P, !doTranspose, AP, GetOStream(
Statistics2),
170 doFillComplete, doOptimizeStorage, labelstr+std::string(
"MueLu::A*P-")+levelstr.str(), APparams);
175 if(pL.
isSublist(
"matrixmatrix: kernel params"))
176 RAPparams->
sublist(
"matrixmatrix: kernel params") = pL.
sublist(
"matrixmatrix: kernel params");
178 if (coarseLevel.IsAvailable(
"RAP reuse data",
this)) {
179 GetOStream(static_cast<MsgType>(
Runtime0 |
Test)) <<
"Reusing previous RAP data" << std::endl;
192 RAPparams->
set(
"compute global constants: temporaries",RAPparams->
get(
"compute global constants: temporaries",
false));
193 RAPparams->
set(
"compute global constants",
true);
199 if (pL.
get<
bool>(
"transpose: use implicit") ==
true) {
202 Ac = MatrixMatrix::Multiply(*P, doTranspose, *AP, !doTranspose, Ac, GetOStream(
Statistics2),
203 doFillComplete, doOptimizeStorage, labelstr+std::string(
"MueLu::R*(AP)-implicit-")+levelstr.str(), RAPparams);
206 RCP<Matrix> R = Get< RCP<Matrix> >(coarseLevel,
"R");
210 Ac = MatrixMatrix::Multiply(*R, !doTranspose, *AP, !doTranspose, Ac, GetOStream(
Statistics2),
211 doFillComplete, doOptimizeStorage, labelstr+std::string(
"MueLu::R*(AP)-explicit-")+levelstr.str(), RAPparams);
215 if(relativeFloor.
size() > 0) {
219 bool repairZeroDiagonals = pL.
get<
bool>(
"RepairMainDiagonal") || pL.
get<
bool>(
"rap: fix zero diagonals");
220 bool checkAc = pL.
get<
bool>(
"CheckMainDiagonal")|| pL.
get<
bool>(
"rap: fix zero diagonals"); ;
221 if (checkAc || repairZeroDiagonals)
226 params->
set(
"printLoadBalancingInfo",
true);
227 params->
set(
"printCommInfo",
true);
231 if(!Ac.is_null()) {std::ostringstream oss; oss <<
"A_" << coarseLevel.GetLevelID(); Ac->setObjectLabel(oss.str());}
232 Set(coarseLevel,
"A", Ac);
234 APparams->
set(
"graph", AP);
235 Set(coarseLevel,
"AP reuse data", APparams);
236 RAPparams->
set(
"graph", Ac);
237 Set(coarseLevel,
"RAP reuse data", RAPparams);
240 if(pL.
isSublist(
"matrixmatrix: kernel params"))
241 RAPparams->
sublist(
"matrixmatrix: kernel params") = pL.
sublist(
"matrixmatrix: kernel params");
243 if (coarseLevel.IsAvailable(
"RAP reuse data",
this)) {
244 GetOStream(static_cast<MsgType>(
Runtime0 |
Test)) <<
"Reusing previous RAP data" << std::endl;
257 RAPparams->
set(
"compute global constants: temporaries",RAPparams->
get(
"compute global constants: temporaries",
false));
258 RAPparams->
set(
"compute global constants",
true);
260 if (pL.
get<
bool>(
"transpose: use implicit") ==
true) {
262 Ac = MatrixFactory::Build(P->getDomainMap(), Teuchos::as<LO>(0));
267 MultiplyRAP(*P, doTranspose, *A, !doTranspose, *P, !doTranspose, *Ac, doFillComplete,
268 doOptimizeStorage, labelstr+std::string(
"MueLu::R*A*P-implicit-")+levelstr.str(),
272 RCP<Matrix> R = Get< RCP<Matrix> >(coarseLevel,
"R");
273 Ac = MatrixFactory::Build(R->getRowMap(), Teuchos::as<LO>(0));
278 MultiplyRAP(*R, !doTranspose, *A, !doTranspose, *P, !doTranspose, *Ac, doFillComplete,
279 doOptimizeStorage, labelstr+std::string(
"MueLu::R*A*P-explicit-")+levelstr.str(),
284 if(relativeFloor.
size() > 0) {
288 bool repairZeroDiagonals = pL.
get<
bool>(
"RepairMainDiagonal") || pL.
get<
bool>(
"rap: fix zero diagonals");
289 bool checkAc = pL.
get<
bool>(
"CheckMainDiagonal")|| pL.
get<
bool>(
"rap: fix zero diagonals"); ;
290 if (checkAc || repairZeroDiagonals)
297 params->
set(
"printLoadBalancingInfo",
true);
298 params->
set(
"printCommInfo",
true);
302 if(!Ac.is_null()) {std::ostringstream oss; oss <<
"A_" << coarseLevel.GetLevelID(); Ac->setObjectLabel(oss.str());}
303 Set(coarseLevel,
"A", Ac);
305 RAPparams->
set(
"graph", Ac);
306 Set(coarseLevel,
"RAP reuse data", RAPparams);
312 if (transferFacts_.begin() != transferFacts_.end()) {
316 for (std::vector<
RCP<const FactoryBase> >::const_iterator it = transferFacts_.begin(); it != transferFacts_.end(); ++it) {
318 GetOStream(
Runtime0) <<
"RAPFactory: call transfer factory: " << fac->
description() << std::endl;
354 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
358 "MueLu::RAPFactory::AddTransferFactory: Transfer factory is not derived from TwoLevelFactoryBase. "
359 "This is very strange. (Note: you can remove this exception if there's a good reason for)");
361 transferFacts_.push_back(factory);
366 #define MUELU_RAPFACTORY_SHORT
367 #endif // MUELU_RAPFACTORY_DEF_HPP
#define SET_VALID_ENTRY(name)
Exception indicating invalid cast attempted.
virtual std::string getObjectLabel() const
static void RelativeDiagonalBoost(RCP< Xpetra::Matrix< Scalar, LocalOrdinal, GlobalOrdinal, Node > > &A, const Teuchos::ArrayView< const double > &relativeThreshold, Teuchos::FancyOStream &fos)
virtual void CallBuild(Level &requestedLevel) const =0
ParameterList & disableRecursiveValidation()
void Release(const FactoryBase &factory)
Decrement the storage counter for all the inputs of a factory.
T & get(const std::string &name, T def_value)
ParameterList & set(std::string const &name, T const &value, std::string const &docString="", RCP< const ParameterEntryValidator > const &validator=null)
static void MultiplyRAP(const Matrix &R, bool transposeR, const Matrix &A, bool transposeA, const Matrix &P, bool transposeP, Matrix &Ac, bool call_FillComplete_on_result=true, bool doOptimizeStorage=true, const std::string &label=std::string(), const RCP< ParameterList > &params=null)
Timer to be used in factories. Similar to Monitor but with additional timers.
#define TEUCHOS_TEST_FOR_EXCEPTION(throw_exception_test, Exception, msg)
RCP< const ParameterList > GetValidParameterList() const
Return a const parameter list of valid parameters that setParameterList() will accept.
One-liner description of what is happening.
void AddTransferFactory(const RCP< const FactoryBase > &factory)
Add transfer factory at the end of the list of transfer factories in RAPFactory.
static void CheckRepairMainDiagonal(RCP< Xpetra::Matrix< Scalar, LocalOrdinal, GlobalOrdinal, Node >> &Ac, bool const &repairZeroDiagonals, Teuchos::FancyOStream &fos, const typename Teuchos::ScalarTraits< Scalar >::magnitudeType threshold=Teuchos::ScalarTraits< typename Teuchos::ScalarTraits< Scalar >::magnitudeType >::zero())
Print even more statistics.
bool isParameter(const std::string &name) const
TEUCHOS_DEPRECATED RCP< T > rcp(T *p, Dealloc_T dealloc, bool owns_mem)
Class that holds all level-specific information.
bool isSublist(const std::string &name) const
Timer to be used in factories. Similar to SubMonitor but adds a timer level by level.
static std::string PrintMatrixInfo(const Matrix &A, const std::string &msgTag, RCP< const Teuchos::ParameterList > params=Teuchos::null)
ParameterList & sublist(const std::string &name, bool mustAlreadyExist=false, const std::string &docString="")
int GetLevelID() const
Return level number.
Exception thrown to report errors in the internal logic of the program.
virtual std::string description() const
Return a simple one-line description of this object.
void Build(Level &fineLevel, Level &coarseLevel) const
Build an object with this factory.
void DeclareInput(Level &fineLevel, Level &coarseLevel) const
Input.