8 #ifndef MUELU_LOCALPERMUTATIONSTRATEGY_DEF_HPP_ 9 #define MUELU_LOCALPERMUTATIONSTRATEGY_DEF_HPP_ 13 #include <Xpetra_MultiVector.hpp> 14 #include <Xpetra_Matrix.hpp> 15 #include <Xpetra_MatrixMatrix.hpp> 16 #include <Xpetra_CrsGraph.hpp> 17 #include <Xpetra_Vector.hpp> 18 #include <Xpetra_VectorFactory.hpp> 19 #include <Xpetra_CrsMatrixWrap.hpp> 21 #include "MueLu_Utilities.hpp" 26 template<
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
// Fills result_permvecs_ with one index vector per ordering produced by
// std::next_permutation over the string `cs`, and records the block width the
// table was built for in permWidth_.
//
// NOTE(review): the numbers fused into these lines look like line numbers of an
// extracted listing and they skip values, so the function signature, the
// declaration of `ss`, the body of the first loop and the `do {` that opens the
// permutation loop are not visible here. Presumably this is
// BuildPermutations(size_t nDofsPerNode) and the loop streams each `t` into
// `ss` -- confirm against the real header before relying on this.
// Remember the width so callers can tell when the table has to be rebuilt.
29 permWidth_ = nDofsPerNode;
// Drop any permutations left over from a previous call.
31 result_permvecs_.clear();
35 for(
size_t t = 0; t<nDofsPerNode; t++)
37 std::string cs = ss.str();
// One slot per character of cs; -1 is the placeholder before decoding.
42 std::vector<int> newPerm(cs.length(),-1);
43 for(
size_t len=0; len<cs.length(); len++) {
// Decode one character of the permutation string into its integer value.
// NOTE(review): subtracting '0' only yields the intended index for single
// digit characters -- confirm nDofsPerNode can never exceed 10.
44 newPerm[len] = Teuchos::as<int>(cs[len]-
'0');
46 result_permvecs_.push_back(newPerm);
48 }
// Advance cs to its next lexicographic ordering; stops after the last one.
while (std::next_permutation(cs.begin(),cs.end()));
// Builds node-local row/column permutation operators for matrix A, applies them
// and a diagonal scaling, and stores the results on currentLevel under the keys
// "A", "permA", "permP", "permQT", "permScaling" and the permutation counters.
//
// For every local node the dense nDofsPerNode x nDofsPerNode sub-block of A is
// extracted, every candidate ordering in result_permvecs_ is scored by the
// product of the entries it would place on the diagonal, and the ordering with
// the largest magnitude is kept.
//
// NOTE(review): the numbers fused into these lines look like line numbers of an
// extracted listing and they skip values. The function signature, the
// declarations of `maxVal`, `value` and `permPmatrix`, several `else` keywords
// and most closing braces are not visible in this excerpt, so the comments
// below describe only the statements that are shown.
51 template<
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
// The guarded region ends at the matching #endif after the statistics output.
53 #ifndef HAVE_MUELU_INST_COMPLEX_INT_INT // TODO remove this -> check scalar = std::complex 54 size_t nDofsPerNode = 1;
// If A carries a "stridedMaps" view, take the block size from that strided map.
// NOTE(review): the result of rcp_dynamic_cast is dereferenced without a
// visible null check -- confirm the view is always backed by a StridedMap.
55 if (A->IsView(
"stridedMaps")) {
56 Teuchos::RCP<const Map> permRowMapStrided = A->getRowMap(
"stridedMaps");
57 nDofsPerNode = Teuchos::rcp_dynamic_cast<
const StridedMap>(permRowMapStrided)->getFixedBlockSize();
60 RCP<const Teuchos::Comm<int> > comm = A->getRowMap()->getComm();
// (row gid, column gid) pairs chosen by the per-node search below.
63 std::vector<std::pair<GlobalOrdinal,GlobalOrdinal> > RowColPairs;
// Rebuild the table of candidate orderings only when the block width changed.
66 if(permWidth_ != nDofsPerNode)
67 BuildPermutations(nDofsPerNode);
70 LocalOrdinal lonDofsPerNode = Teuchos::as<LocalOrdinal> (nDofsPerNode);
71 Teuchos::ArrayView<const LocalOrdinal> indices;
72 Teuchos::ArrayView<const Scalar> vals;
// Scratch storage reused for every node: the dense node block and the global
// row ids of its dofs.
73 Teuchos::SerialDenseMatrix<LocalOrdinal,Scalar> subBlockMatrix(nDofsPerNode, nDofsPerNode,
true);
74 std::vector<GlobalOrdinal> growIds(nDofsPerNode);
// Integer division: local rows beyond a whole multiple of nDofsPerNode are not
// visited by the node loop.
78 LocalOrdinal numLocalNodes = A->getRowMap()->getNodeNumElements()/nDofsPerNode;
79 for (LocalOrdinal node = 0; node < numLocalNodes; ++node) {
// Presumably resets the block to zero through the default argument -- TODO
// confirm against the Teuchos documentation.
82 subBlockMatrix.putScalar();
// Fill one row of the node block per dof of this node.
87 for (LocalOrdinal lrdof = 0; lrdof < lonDofsPerNode; ++lrdof) {
88 GlobalOrdinal grow = getGlobalDofId(A, node, lrdof);
89 growIds[lrdof] = grow;
92 A->getLocalRowView(A->getRowMap()->getLocalElement(grow), indices, vals);
// First pass over the row: track the largest entry magnitude in maxVal.
96 for (
size_t j = 0; j < Teuchos::as<size_t>(indices.size()); j++) {
97 if(Teuchos::ScalarTraits<Scalar>::magnitude(vals[j]) > maxVal) {
98 maxVal = Teuchos::ScalarTraits<Scalar>::magnitude(vals[j]);
102 GlobalOrdinal grnodeid = globalDofId2globalNodeId(A,grow);
// Second pass: keep only the entries whose column belongs to the same node.
104 for (
size_t j = 0; j < Teuchos::as<size_t>(indices.size()); j++) {
105 GlobalOrdinal gcol = A->getColMap()->getGlobalElement(indices[j]);
106 GlobalOrdinal gcnodeid = globalDofId2globalNodeId(A,gcol);
107 if (grnodeid == gcnodeid) {
// Entry stored relative to the row maximum. The column inside the block is
// gcol % nDofsPerNode.
// NOTE(review): this assumes global dof ids are numbered so that the
// remainder is the dof index within the node -- confirm for maps with an
// offset.
109 subBlockMatrix(lrdof, gcol % nDofsPerNode) = vals[j]/maxVal;
// Alternative path (its guarding condition is not visible here): the entry is
// stored unscaled and a message is written to std::cout.
112 subBlockMatrix(lrdof, gcol % nDofsPerNode) = vals[j];
113 std::cout <<
"maxVal never should be zero!!!!" << std::endl;
// Score every candidate ordering: multiply the entries subBlockMatrix(j, vv[j])
// that the ordering would put on the diagonal.
132 std::vector<Scalar> performance_vector = std::vector<Scalar>(result_permvecs_.size());
133 for (
size_t t = 0; t < result_permvecs_.size(); t++) {
134 std::vector<int> vv = result_permvecs_[t];
136 for(
size_t j=0; j<vv.size(); j++) {
137 value = value * subBlockMatrix(j,vv[j]);
139 performance_vector[t] = value;
// Pick the ordering whose score has the largest magnitude.
// NOTE(review): maxVal is reused from the row scan; its reset is not visible in
// this excerpt.
153 size_t maxPerformancePermutationIdx = 0;
154 for (
size_t j = 0; j < Teuchos::as<size_t>(performance_vector.size()); j++) {
155 if(Teuchos::ScalarTraits<Scalar>::magnitude(performance_vector[j]) > maxVal) {
156 maxVal = Teuchos::ScalarTraits<Scalar>::magnitude(performance_vector[j]);
157 maxPerformancePermutationIdx = j;
// Translate the winning ordering into (row gid, column gid) pairs.
162 std::vector<int> bestPerformancePermutation = result_permvecs_[maxPerformancePermutationIdx];
163 for(
size_t t = 0; t<nDofsPerNode; t++) {
164 RowColPairs.push_back(std::make_pair(growIds[t],growIds[bestPerformancePermutation[t]]));
// Pperm lives on the row map and Qperm on the domain map; both start at 0.0 and
// later hold one global index per local entry.
171 Teuchos::RCP<Vector> Pperm = VectorFactory::Build(A->getRowMap());
172 Teuchos::RCP<Vector> Qperm = VectorFactory::Build(A->getDomainMap());
174 Pperm->putScalar(0.0);
175 Qperm->putScalar(0.0);
177 Teuchos::ArrayRCP<Scalar> PpermData = Pperm->getDataNonConst(0);
178 Teuchos::ArrayRCP<Scalar> QpermData = Qperm->getDataNonConst(0);
// Consume the pairs one by one: the row gid ik is written at the local position
// of ik in Pperm and at the local position of jk in Qperm.
// NOTE(review): erasing the front element of a std::vector on every iteration
// shifts the remaining pairs each time.
180 typename std::vector<std::pair<GlobalOrdinal, GlobalOrdinal> >::iterator p = RowColPairs.begin();
181 while(p != RowColPairs.end() ) {
182 GlobalOrdinal ik = (*p).first;
183 GlobalOrdinal jk = (*p).second;
185 LocalOrdinal lik = A->getRowMap()->getLocalElement(ik);
186 LocalOrdinal ljk = A->getDomainMap()->getLocalElement(jk);
188 Pperm->replaceLocalValue(lik,ik);
189 Qperm->replaceLocalValue(ljk,ik);
191 p = RowColPairs.erase(p);
194 if(RowColPairs.size()>0) GetOStream(
Warnings0) <<
"MueLu::LocalPermutationStrategy: There are Row/col pairs left!" << std::endl;
// Assemble the two permutation matrices with a single 1.0 per local row; the
// column index is the value stored in PpermData / QpermData for that row.
// NOTE(review): both matrices are built on A's row map while Qperm lives on the
// domain map, and rows never written above keep 0.0 (column 0) -- confirm the
// two maps share a local layout and that every row receives a pair.
200 Teuchos::RCP<CrsMatrixWrap> permPTmatrix = Teuchos::rcp(
new CrsMatrixWrap(A->getRowMap(),1,Xpetra::StaticProfile));
201 Teuchos::RCP<CrsMatrixWrap> permQTmatrix = Teuchos::rcp(
new CrsMatrixWrap(A->getRowMap(),1,Xpetra::StaticProfile));
203 for(
size_t row=0; row<A->getNodeNumRows(); row++) {
204 Teuchos::ArrayRCP<GlobalOrdinal> indoutP(1,Teuchos::as<GO>(PpermData[row]));
205 Teuchos::ArrayRCP<GlobalOrdinal> indoutQ(1,Teuchos::as<GO>(QpermData[row]));
206 Teuchos::ArrayRCP<Scalar> valout(1,1.0);
207 permPTmatrix->insertGlobalValues(A->getRowMap()->getGlobalElement(row), indoutP.view(0,indoutP.size()), valout.view(0,valout.size()));
208 permQTmatrix->insertGlobalValues (A->getRowMap()->getGlobalElement(row), indoutQ.view(0,indoutQ.size()), valout.view(0,valout.size()));
211 permPTmatrix->fillComplete();
212 permQTmatrix->fillComplete();
// Apply the permutations: first A * permQT, then permP * (A * permQT).
// NOTE(review): the declaration of permPmatrix is not visible here; presumably
// it is derived from permPTmatrix -- confirm.
226 Teuchos::RCP<Matrix> ApermQt = Xpetra::MatrixMatrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Multiply(*A,
false, *permQTmatrix,
false, GetOStream(
Statistics2),
true,
true);
227 Teuchos::RCP<Matrix> permPApermQt = Xpetra::MatrixMatrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Multiply(*permPmatrix,
false, *ApermQt,
false, GetOStream(
Statistics2),
true,
true);
// Build the inverse of the permuted diagonal.
// NOTE(review): diagVecData is obtained before getLocalDiagCopy fills diagVec --
// confirm the view reflects the later write on every backend.
236 Teuchos::RCP<Vector> diagVec = VectorFactory::Build(permPApermQt->getRowMap(),
true);
237 Teuchos::RCP<Vector> invDiagVec = VectorFactory::Build(permPApermQt->getRowMap(),
true);
238 Teuchos::ArrayRCP< const Scalar > diagVecData = diagVec->getData(0);
239 Teuchos::ArrayRCP< Scalar > invDiagVecData = invDiagVec->getDataNonConst(0);
241 LO lCntZeroDiagonals = 0;
242 permPApermQt->getLocalDiagCopy(*diagVec);
243 for(
size_t i = 0; i<diagVec->getMap()->getNodeNumElements(); ++i) {
// Non-zero diagonal entries are inverted; the other visible assignment stores
// 1.0 (its `else` and any counter update are not visible in this excerpt).
244 if(diagVecData[i] != 0.0)
245 invDiagVecData[i] = 1/diagVecData[i];
247 invDiagVecData[i] = 1.0;
// Sum the local zero-diagonal count over the communicator and report it.
254 GO gCntZeroDiagonals = 0;
255 GO glCntZeroDiagonals = Teuchos::as<GlobalOrdinal>(lCntZeroDiagonals);
256 MueLu_sumAll(comm,glCntZeroDiagonals,gCntZeroDiagonals);
257 GetOStream(
Statistics0) <<
"MueLu::LocalPermutationStrategy: found " << gCntZeroDiagonals <<
" zeros on diagonal" << std::endl;
// Diagonal scaling operator: one entry per local row holding invDiagVecData.
260 Teuchos::RCP<CrsMatrixWrap> diagScalingOp = Teuchos::rcp(
new CrsMatrixWrap(permPApermQt->getRowMap(),1,Xpetra::StaticProfile));
262 for(
size_t row=0; row<A->getNodeNumRows(); row++) {
263 Teuchos::ArrayRCP<GlobalOrdinal> indout(1,permPApermQt->getRowMap()->getGlobalElement(row));
264 Teuchos::ArrayRCP<Scalar> valout(1,invDiagVecData[row]);
265 diagScalingOp->insertGlobalValues(A->getRowMap()->getGlobalElement(row), indout.view(0,indout.size()), valout.view(0,valout.size()));
267 diagScalingOp->fillComplete();
// scaledA = diagScalingOp * permPApermQt.
269 Teuchos::RCP<Matrix> scaledA = Xpetra::MatrixMatrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Multiply(*diagScalingOp,
false, *permPApermQt,
false, GetOStream(
Statistics2),
true,
true);
// Publish the operators on the level, all registered under genFactory.
270 currentLevel.
Set(
"A", Teuchos::rcp_dynamic_cast<Matrix>(scaledA), genFactory);
272 currentLevel.
Set(
"permA", Teuchos::rcp_dynamic_cast<Matrix>(permPApermQt), genFactory);
273 currentLevel.
Set(
"permP", Teuchos::rcp_dynamic_cast<Matrix>(permPmatrix), genFactory);
274 currentLevel.
Set(
"permQT", Teuchos::rcp_dynamic_cast<Matrix>(permQTmatrix), genFactory);
275 currentLevel.
Set(
"permScaling", Teuchos::rcp_dynamic_cast<Matrix>(diagScalingOp), genFactory);
// Count row permutations: a local row whose diagonal entry in permPmatrix is
// 0.0 is counted as permuted.
279 Teuchos::RCP<Vector> diagPVec = VectorFactory::Build(permPmatrix->getRowMap(),
true);
280 permPmatrix->getLocalDiagCopy(*diagPVec);
281 Teuchos::ArrayRCP< const Scalar > diagPVecData = diagPVec->getData(0);
282 GlobalOrdinal lNumRowPermutations = 0;
283 GlobalOrdinal gNumRowPermutations = 0;
284 for(
size_t i = 0; i<diagPVec->getMap()->getNodeNumElements(); ++i) {
285 if(diagPVecData[i] == 0.0) {
286 lNumRowPermutations++;
291 MueLu_sumAll(diagPVec->getMap()->getComm(), lNumRowPermutations, gNumRowPermutations);
// Same count for column permutations, using the diagonal of permQTmatrix.
295 Teuchos::RCP<Vector> diagQTVec = VectorFactory::Build(permQTmatrix->getRowMap(),
true);
296 permQTmatrix->getLocalDiagCopy(*diagQTVec);
297 Teuchos::ArrayRCP< const Scalar > diagQTVecData = diagQTVec->getData(0);
298 GlobalOrdinal lNumColPermutations = 0;
299 GlobalOrdinal gNumColPermutations = 0;
300 for(
size_t i = 0; i<diagQTVec->getMap()->getNodeNumElements(); ++i) {
301 if(diagQTVecData[i] == 0.0) {
302 lNumColPermutations++;
307 MueLu_sumAll(diagQTVec->getMap()->getComm(), lNumColPermutations, gNumColPermutations);
// Publish the counters; the two wide-range counters are always stored as 0 here.
309 currentLevel.
Set(
"#RowPermutations", gNumRowPermutations, genFactory);
310 currentLevel.
Set(
"#ColPermutations", gNumColPermutations, genFactory);
311 currentLevel.
Set(
"#WideRangeRowPermutations", 0, genFactory);
312 currentLevel.
Set(
"#WideRangeColPermutations", 0, genFactory);
// Report the counts against the global number of map entries.
314 GetOStream(
Statistics0) <<
"#Row permutations/max possible permutations: " << gNumRowPermutations <<
"/" << diagPVec->getMap()->getGlobalNumElements() << std::endl;
315 GetOStream(
Statistics0) <<
"#Column permutations/max possible permutations: " << gNumColPermutations <<
"/" << diagQTVec->getMap()->getGlobalNumElements() << std::endl;
317 #endif // #ifndef HAVE_MUELU_INST_COMPLEX_INT_INT 320 template<
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
// Maps (localNodeId, localDof) to a global dof id: the local dof index is
// localNodeId * nDofsPerNode + localDof, which is then looked up in A's row map.
//
// NOTE(review): the numbers fused into these lines look like line numbers of an
// extracted listing and they skip values; the function signature and the closing
// braces are not visible here. Presumably this is getGlobalDofId(A, localNodeId,
// localDof) -- confirm against the header.
// Block size defaults to 1 and is taken from the "stridedMaps" view when present.
// NOTE(review): the rcp_dynamic_cast result is dereferenced without a visible
// null check -- confirm the view is always backed by a StridedMap.
322 size_t nDofsPerNode = 1;
323 if (A->IsView(
"stridedMaps")) {
324 Teuchos::RCP<const Map> permRowMapStrided = A->getRowMap(
"stridedMaps");
325 nDofsPerNode = Teuchos::rcp_dynamic_cast<
const StridedMap>(permRowMapStrided)->getFixedBlockSize();
// The product mixes LocalOrdinal with size_t and is converted back to
// LocalOrdinal on assignment.
328 LocalOrdinal localDofId = localNodeId * nDofsPerNode + localDof;
330 return A->getRowMap()->getGlobalElement(localDofId);
// Converts a global dof id into a global node id by dividing it by the number
// of dofs per node.
//
// NOTE(review): the numbers fused into these lines look like line numbers of an
// extracted listing and they skip values; the function signature and the closing
// braces are not visible here. Presumably this is globalDofId2globalNodeId(A,
// grid) -- confirm against the header.
333 template<
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
// Block size defaults to 1 and is taken from the "stridedMaps" view when present.
// NOTE(review): the rcp_dynamic_cast result is dereferenced without a visible
// null check -- confirm the view is always backed by a StridedMap.
335 size_t nDofsPerNode = 1;
336 if (A->IsView(
"stridedMaps")) {
337 Teuchos::RCP<const Map> permRowMapStrided = A->getRowMap(
"stridedMaps");
338 nDofsPerNode = Teuchos::rcp_dynamic_cast<
const StridedMap>(permRowMapStrided)->getFixedBlockSize();
// Both operands are cast to GlobalOrdinal before dividing; presumably an integer
// division that truncates -- assumes GlobalOrdinal is an integral type.
341 return (GlobalOrdinal) grid / (GlobalOrdinal)nDofsPerNode;
Important warning messages (one line)
static RCP< Matrix > Transpose(Matrix &Op, bool optimizeTranspose=false, const std::string &label=std::string())
Transpose a Xpetra::Matrix.
void BuildPermutation(const Teuchos::RCP< Matrix > &A, const Teuchos::RCP< const Map > permRowMap, Level &currentLevel, const FactoryBase *genFactory) const
build permutation operators
Namespace for MueLu classes and methods.
Print even more statistics.
GlobalOrdinal getGlobalDofId(const Teuchos::RCP< Matrix > &A, LocalOrdinal localNodeId, LocalOrdinal localDof) const
Base class for factories (e.g., R, P, and A_coarse).
Print statistics that do not involve significant additional computation.
#define MueLu_sumAll(rcpComm, in, out)
Class that holds all level-specific information.
void BuildPermutations(size_t nDofsPerNode) const
GlobalOrdinal globalDofId2globalNodeId(const Teuchos::RCP< Matrix > &A, GlobalOrdinal grid) const
void Set(const std::string &ename, const T &entry, const FactoryBase *factory=NoFactory::get())