46 #ifndef MUELU_SEMICOARSENPFACTORY_DEF_HPP
47 #define MUELU_SEMICOARSENPFACTORY_DEF_HPP
67 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
71 #define SET_VALID_ENTRY(name) validParamList->setEntry(name, MasterList::getEntry(name))
73 #undef SET_VALID_ENTRY
78 validParamList->
set<
RCP<const FactoryBase> >(
"LineDetection_VertLineIds", Teuchos::null,
"Generating factory for LineDetection information");
79 validParamList->
set<
RCP<const FactoryBase> >(
"LineDetection_Layers", Teuchos::null,
"Generating factory for LineDetection information");
80 validParamList->
set<
RCP<const FactoryBase> >(
"CoarseNumZLayers", Teuchos::null,
"Generating factory for LineDetection information");
82 return validParamList;
85 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
87 Input(fineLevel,
"A");
88 Input(fineLevel,
"Nullspace");
90 Input(fineLevel,
"LineDetection_VertLineIds");
91 Input(fineLevel,
"LineDetection_Layers");
92 Input(fineLevel,
"CoarseNumZLayers");
100 bTransferCoordinates_ =
true;
102 }
else if (bTransferCoordinates_ ==
true){
107 if (myCoordsFact == Teuchos::null) { myCoordsFact = fineLevel.
GetFactoryManager()->GetFactory(
"Coordinates"); }
110 bTransferCoordinates_ =
true;
115 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
117 return BuildP(fineLevel, coarseLevel);
120 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
125 RCP<Matrix> A = Get< RCP<Matrix> > (fineLevel,
"A");
126 RCP<MultiVector> fineNullspace = Get< RCP<MultiVector> > (fineLevel,
"Nullspace");
130 LO CoarsenRate = as<LO>(pL.get<
int>(
"semicoarsen: coarsen rate"));
133 LO BlkSize = A->GetFixedBlockSize();
135 LO Ndofs = rowMap->getNodeNumElements();
136 LO Nnodes = Ndofs/BlkSize;
139 LO FineNumZLayers = Get< LO >(fineLevel,
"CoarseNumZLayers");
140 Teuchos::ArrayRCP<LO> TVertLineId = Get< Teuchos::ArrayRCP<LO> > (fineLevel,
"LineDetection_VertLineIds");
143 LO* LayerId = TLayerId.getRawPtr();
149 GO Ncoarse = MakeSemiCoarsenP(Nnodes,FineNumZLayers,CoarsenRate,LayerId,VertLineId,
150 BlkSize, A, P, theCoarseMap, fineNullspace,coarseNullspace);
153 if (A->IsView(
"stridedMaps") ==
true)
154 P->CreateView(
"stridedMaps", A->getRowMap(
"stridedMaps"), theCoarseMap);
156 P->CreateView(
"stridedMaps", P->getRangeMap(), theCoarseMap);
162 LO CoarseNumZLayers = FineNumZLayers*Ncoarse;
163 CoarseNumZLayers /= Ndofs;
167 Set(coarseLevel,
"P", P);
169 Set(coarseLevel,
"Nullspace", coarseNullspace);
172 if(bTransferCoordinates_) {
176 if (fineLevel.GetLevelID() == 0 &&
181 if (myCoordsFact == Teuchos::null) { myCoordsFact = fineLevel.GetFactoryManager()->GetFactory(
"Coordinates"); }
182 if (fineLevel.IsAvailable(
"Coordinates", myCoordsFact.
get())) {
183 fineCoords = fineLevel.Get<
RCP<xdMV> >(
"Coordinates", myCoordsFact.
get());
197 for (
auto it = z.
begin(); it != z.
end(); ++it) {
198 if(*it > zval_max) zval_max = *it;
199 if(*it < zval_min) zval_min = *it;
202 LO myCoarseZLayers = Teuchos::as<LO>(CoarseNumZLayers);
205 if(myCoarseZLayers == 1) {
206 myZLayerCoords[0] = zval_min;
209 for(LO k = 0; k<myCoarseZLayers; ++k) {
210 myZLayerCoords[k] = k*dz;
218 LO numVertLines = Nnodes / FineNumZLayers;
219 LO numLocalCoarseNodes = numVertLines * myCoarseZLayers;
228 MapFactory::Build (fineCoords->getMap()->lib(),
230 Teuchos::as<size_t>(numLocalCoarseNodes),
231 fineCoords->getMap()->getIndexBase(),
232 fineCoords->getMap()->getComm());
234 coarseCoords->putScalar(-1.0);
240 LO cntCoarseNodes = 0;
241 for( LO vt = 0; vt < TVertLineId.size(); ++vt) {
243 LO curVertLineId = TVertLineId[vt];
245 if(cx[curVertLineId * myCoarseZLayers] == -1.0 &&
246 cy[curVertLineId * myCoarseZLayers] == -1.0) {
248 for (LO n=0; n<myCoarseZLayers; ++n) {
249 cx[curVertLineId * myCoarseZLayers + n] = x[vt];
250 cy[curVertLineId * myCoarseZLayers + n] = y[vt];
251 cz[curVertLineId * myCoarseZLayers + n] = myZLayerCoords[n];
253 cntCoarseNodes += myCoarseZLayers;
257 if(cntCoarseNodes == numLocalCoarseNodes)
break;
261 Set(coarseLevel,
"Coordinates", coarseCoords);
266 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
296 if (Thin == 1) NCpts = (
LO) ceil(temp);
297 else NCpts = (
LO) floor(temp);
301 if (NCpts < 1) NCpts = 1;
311 for (i = 1; i <= NCpts; i++) {
312 (*LayerCpts)[i] = (
LO) floor(di);
319 #define MaxHorNeighborNodes 75
321 template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
378 int NLayers, NVertLines, MaxNnz, NCLayers, MyLine, MyLayer;
379 int *InvLineLayer=NULL, *CptLayers=NULL, StartLayer, NStencilNodes;
380 int BlkRow, dof_j, node_k, *Sub2FullMap=NULL, RowLeng;
381 int i, j, iii, col, count, index, loc, PtRow, PtCol;
382 SC *BandSol=NULL, *BandMat=NULL, TheSum;
383 int *IPIV=NULL, KL, KU, KLU, N, NRHS, LDAB,INFO;
387 int MaxStencilSize, MaxNnzPerRow;
389 int CurRow, LastGuy = -1, NewPtr;
392 LO *Layerdofs = NULL, *Col2Dof = NULL;
404 Nghost = Amat->getColMap()->getNodeNumElements() - Amat->getDomainMap()->getNodeNumElements();
405 if (Nghost < 0) Nghost = 0;
413 for (i = 0; i < Ntotal*DofsPerNode; i++)
414 valptr[i]= LayerId[i/DofsPerNode];
417 importer = Amat->getCrsGraph()->getImporter();
418 if (importer == Teuchos::null) {
419 importer = ImportFactory::Build(Amat->getDomainMap(), Amat->getColMap());
423 valptr= dtemp->getDataNonConst(0);
424 for (i = 0; i < Ntotal*DofsPerNode+Nghost; i++) Layerdofs[i]= valptr[i];
425 valptr= localdtemp->getDataNonConst(0);
426 for (i = 0; i < Ntotal*DofsPerNode; i++) valptr[i]= i%DofsPerNode;
428 valptr= dtemp->getDataNonConst(0);
429 for (i = 0; i < Ntotal*DofsPerNode+Nghost; i++) Col2Dof[i]= valptr[i];
432 NLayers = LayerId[0];
433 NVertLines= VertLineId[0];
435 else { NLayers = -1; NVertLines = -1; }
437 for (i = 1; i < Ntotal; i++) {
438 if ( VertLineId[i] > NVertLines ) NVertLines = VertLineId[i];
439 if ( LayerId[i] > NLayers ) NLayers = LayerId[i];
450 for (i=0; i < Ntotal; i++) {
451 InvLineLayer[ VertLineId[i]+1+LayerId[i]*NVertLines ] = i;
459 NCLayers = FindCpts(nz,CoarsenRate,0, &CptLayers);
468 if (NCLayers < 2) MaxStencilSize = nz;
469 else MaxStencilSize = CptLayers[2];
471 for (i = 3; i <= NCLayers; i++) {
472 if (MaxStencilSize < CptLayers[i]- CptLayers[i-2])
473 MaxStencilSize = CptLayers[i]- CptLayers[i-2];
476 if (MaxStencilSize < nz - CptLayers[NCLayers-1]+1)
477 MaxStencilSize = nz - CptLayers[NCLayers-1]+1;
492 KL = 2*DofsPerNode-1;
493 KU = 2*DofsPerNode-1;
507 Ndofs = DofsPerNode*Ntotal;
508 MaxNnz = 2*DofsPerNode*Ndofs;
513 std::vector<size_t> stridingInfo_;
514 stridingInfo_.push_back(DofsPerNode);
517 coarseMap = StridedMapFactory::Build(rowMap->lib(),
519 NCLayers*NVertLines*DofsPerNode,
531 coarseNullspace = MultiVectorFactory::Build(coarseMap, fineNullspace->getNumVectors());
538 Pptr[0] = 0; Pptr[1] = 0;
548 for (i = 1; i <= MaxNnz; i++) Pcols[i] = -1;
550 for (i = 1; i <= DofsPerNode*Ntotal+1; i++) {
552 count += (2*DofsPerNode);
564 for (MyLine=1; MyLine <= NVertLines; MyLine += 1) {
565 for (iii=1; iii <= NCLayers; iii+= 1) {
567 MyLayer = CptLayers[iii];
580 if (iii != 1 ) StartLayer = CptLayers[iii-1]+1;
583 if (iii != NCLayers) NStencilNodes= CptLayers[iii+1]-StartLayer;
584 else NStencilNodes= NLayers - StartLayer + 1;
587 N = NStencilNodes*DofsPerNode;
594 for (i = 0; i < NStencilNodes*DofsPerNode*DofsPerNode; i++)
596 for (i = 0; i < LDAB*N; i++) BandMat[ i] = 0.0;
603 for (node_k=1; node_k <= NStencilNodes ; node_k++) {
609 BlkRow = InvLineLayer[MyLine+(StartLayer+node_k-2)*NVertLines]+1;
610 Sub2FullMap[node_k] = BlkRow;
623 if (StartLayer+node_k-1 != MyLayer) {
624 for (
int dof_i=0; dof_i < DofsPerNode; dof_i++) {
626 j = (BlkRow-1)*DofsPerNode+dof_i;
629 Amat->getLocalRowView(j, AAcols, AAvals);
632 RowLeng = AAvals.
size();
636 for (i = 0; i < RowLeng; i++) {
637 LayDiff[i] = Layerdofs[Acols[i]]-StartLayer-node_k+2;
645 PtRow = (node_k-1)*DofsPerNode+dof_i+1;
646 for (dof_j=0; dof_j < DofsPerNode; dof_j++) {
647 PtCol = (node_k-1)*DofsPerNode+dof_j + 1;
651 for (i = 0; i < RowLeng; i++) {
652 if ((LayDiff[i] == 0) && (Col2Dof[Acols[i]] == dof_j))
655 index = LDAB*(PtCol-1)+KLU+PtRow-PtCol;
656 BandMat[index] = TheSum;
657 if (node_k != NStencilNodes) {
661 for (i = 0; i < RowLeng; i++) {
662 if ((LayDiff[i] == 1) &&(Col2Dof[Acols[i]]== dof_j))
665 j = PtCol+DofsPerNode;
666 index=LDAB*(j-1)+KLU+PtRow-j;
667 BandMat[index] = TheSum;
673 for (i = 0; i < RowLeng; i++) {
674 if ((LayDiff[i]== -1) &&(Col2Dof[Acols[i]]== dof_j))
677 j = PtCol-DofsPerNode;
678 index=LDAB*(j-1)+KLU+PtRow-j;
679 BandMat[index] = TheSum;
689 for (
int k = 0; k < static_cast<int>(fineNullspace->getNumVectors()); k++) {
692 for (
int dof_i = 0; dof_i < DofsPerNode; dof_i++) {
693 OneCNull[( col-1)*DofsPerNode+dof_i] = OneFNull[ (BlkRow-1)*DofsPerNode+dof_i];
697 for (
int dof_i = 0; dof_i < DofsPerNode; dof_i++) {
700 PtRow = (node_k-1)*DofsPerNode+dof_i+1;
701 index = LDAB*(PtRow-1)+KLU;
702 BandMat[index] = 1.0;
703 BandSol[(dof_i)*DofsPerNode*NStencilNodes+PtRow-1] = 1.;
710 lapack.
GBTRF( N, N, KL, KU, BandMat, LDAB, IPIV, &INFO);
714 lapack.
GBTRS(notrans[0], N, KL, KU, NRHS, BandMat, LDAB, IPIV,
719 for (dof_j=0; dof_j < DofsPerNode; dof_j++) {
720 for (
int dof_i=0; dof_i < DofsPerNode; dof_i++) {
721 for (i =1; i <= NStencilNodes ; i++) {
722 index = (Sub2FullMap[i]-1)*DofsPerNode+dof_i+1;
724 Pcols[loc] = (col-1)*DofsPerNode+dof_j+1;
725 Pvals[loc] = BandSol[dof_j*DofsPerNode*NStencilNodes +
726 (i-1)*DofsPerNode + dof_i];
727 Pptr[index]= Pptr[index] + 1;
743 for (
size_t ii=1; ii <= Pptr[Ntotal*DofsPerNode]-1; ii++) {
744 if (ii == Pptr[CurRow]) {
745 Pptr[CurRow] = LastGuy;
747 while (ii > Pptr[CurRow]) {
748 Pptr[CurRow] = LastGuy;
752 if (Pcols[ii] != -1) {
753 Pcols[NewPtr-1] = Pcols[ii]-1;
754 Pvals[NewPtr-1] = Pvals[ii];
759 for (i = CurRow; i <= Ntotal*DofsPerNode; i++) Pptr[CurRow] = LastGuy;
764 for (i=-Ntotal*DofsPerNode+1; i>= 2 ; i--) {
765 Pptr[i-1] = Pptr[i-2];
773 RCP<CrsMatrix> PCrs = rcp_dynamic_cast<CrsMatrixWrap>(P)->getCrsMatrix();
774 LO nnz = Pptr[Ndofs];
775 PCrs->allocateAllValues(nnz, rcpRowPtr, rcpColumns, rcpValues);
783 for (
LO ii = 0; ii <= Ndofs; ii++) rowPtr[ii] = Pptr[ii];
784 for (
LO ii = 0; ii < nnz; ii++) columns[ii] = Pcols[ii];
785 for (
LO ii = 0; ii < nnz; ii++) values[ii] = Pvals[ii];
786 PCrs->setAllValues(rcpRowPtr, rcpColumns, rcpValues);
787 PCrs->expertStaticFillComplete(coarseMap, Amat->getDomainMap());
790 return NCLayers*NVertLines*DofsPerNode;
794 #define MUELU_SEMICOARSENPFACTORY_SHORT
795 #endif // MUELU_SEMICOARSENPFACTORY_DEF_HPP
ParameterList & set(std::string const &name, T const &value, std::string const &docString="", RCP< const ParameterEntryValidator > const &validator=null)
RCP< const ParameterList > GetValidParameterList() const
Return a const parameter list of valid parameters that setParameterList() will accept.
Timer to be used in factories. Similar to Monitor but with additional timers.
#define TEUCHOS_TEST_FOR_EXCEPTION(throw_exception_test, Exception, msg)
void DeclareInput(Level &fineLevel, Level &coarseLevel) const
Input.
void GBTRF(const OrdinalType &m, const OrdinalType &n, const OrdinalType &kl, const OrdinalType &ku, ScalarType *A, const OrdinalType &lda, OrdinalType *IPIV, OrdinalType *info) const
void Build(Level &fineLevel, Level &coarseLevel) const
Build an object with this factory.
static const NoFactory * get()
TEUCHOS_DEPRECATED RCP< T > rcp(T *p, Dealloc_T dealloc, bool owns_mem)
void BuildP(Level &fineLevel, Level &coarseLevel) const
Abstract Build method.
Class that holds all level-specific information.
LO FindCpts(LO const PtsPerLine, LO const CoarsenRate, LO const Thin, LO **LayerCpts) const
void Set(const std::string &ename, const T &entry, const FactoryBase *factory=NoFactory::get())
static RCP< Vector > Build(const Teuchos::RCP< const Map > &map, bool zeroOut=true)
void GBTRS(const char &TRANS, const OrdinalType &n, const OrdinalType &kl, const OrdinalType &ku, const OrdinalType &nrhs, const ScalarType *A, const OrdinalType &lda, const OrdinalType *IPIV, ScalarType *B, const OrdinalType &ldb, OrdinalType *info) const
#define SET_VALID_ENTRY(name)
#define MaxHorNeighborNodes
LO MakeSemiCoarsenP(LO const Ntotal, LO const nz, LO const CoarsenRate, LO const LayerId[], LO const VertLineId[], LO const DofsPerNode, RCP< Matrix > &Amat, RCP< Matrix > &P, RCP< const Map > &coarseMap, const RCP< MultiVector > fineNullspace, RCP< MultiVector > &coarseNullspace) const
const RCP< const FactoryManagerBase > GetFactoryManager()
returns the current factory manager
int GetLevelID() const
Return level number.
Exception throws to report errors in the internal logical of the program.
void DeclareInput(const std::string &ename, const FactoryBase *factory, const FactoryBase *requestedBy=NoFactory::get())
Callback from FactoryBase::CallDeclareInput() and FactoryBase::DeclareInput()
bool IsAvailable(const std::string &ename, const FactoryBase *factory=NoFactory::get()) const
Test whether a need's value has been saved.