MueLu  Version of the Day
MueLu_LocalPermutationStrategy_def.hpp
Go to the documentation of this file.
1 /*
2  * MueLu_LocalPermutationStrategy_def.hpp
3  *
4  * Created on: Feb 19, 2013
5  * Author: tobias
6  */
7 
8 #ifndef MUELU_LOCALPERMUTATIONSTRATEGY_DEF_HPP_
9 #define MUELU_LOCALPERMUTATIONSTRATEGY_DEF_HPP_
10 
11 #include <algorithm>
12 
13 #include <Xpetra_MultiVector.hpp>
14 #include <Xpetra_Matrix.hpp>
15 #include <Xpetra_MatrixMatrix.hpp>
16 #include <Xpetra_CrsGraph.hpp>
17 #include <Xpetra_Vector.hpp>
18 #include <Xpetra_VectorFactory.hpp>
19 #include <Xpetra_CrsMatrixWrap.hpp>
20 
21 #include "MueLu_Utilities.hpp"
23 
24 namespace MueLu {
25 
26  template<class Scalar, class LocalOrdinal, class GlobalOrdinal, class Node>
28 
29  permWidth_ = nDofsPerNode;
30 
31  result_permvecs_.clear();
32 
33  // build permutation string
34  std::stringstream ss;
35  for(size_t t = 0; t<nDofsPerNode; t++)
36  ss << t;
37  std::string cs = ss.str();
38  //std::vector<std::string> result_perms;
39  do {
40  //result_perms.push_back(cs);
41 
42  std::vector<int> newPerm(cs.length(),-1);
43  for(size_t len=0; len<cs.length(); len++) {
44  newPerm[len] = Teuchos::as<int>(cs[len]-'0');
45  }
46  result_permvecs_.push_back(newPerm);
47 
48  } while (std::next_permutation(cs.begin(),cs.end()));
49  }
50 
51  template<class Scalar, class LocalOrdinal, class GlobalOrdinal, class Node>
52  void LocalPermutationStrategy<Scalar, LocalOrdinal, GlobalOrdinal, Node>::BuildPermutation(const Teuchos::RCP<Matrix> & A, const Teuchos::RCP<const Map> permRowMap, Level & currentLevel, const FactoryBase* genFactory) const {
53 #ifndef HAVE_MUELU_INST_COMPLEX_INT_INT // TODO remove this -> check scalar = std::complex
54  size_t nDofsPerNode = 1;
55  if (A->IsView("stridedMaps")) {
56  Teuchos::RCP<const Map> permRowMapStrided = A->getRowMap("stridedMaps");
57  nDofsPerNode = Teuchos::rcp_dynamic_cast<const StridedMap>(permRowMapStrided)->getFixedBlockSize();
58  }
59 
60  RCP<const Teuchos::Comm<int> > comm = A->getRowMap()->getComm();
61 
63  std::vector<std::pair<GlobalOrdinal,GlobalOrdinal> > RowColPairs;
64 
65  // check whether we have to (re)build the permutation vector
66  if(permWidth_ != nDofsPerNode)
67  BuildPermutations(nDofsPerNode);
68 
69  // declare local variables used inside loop
70  LocalOrdinal lonDofsPerNode = Teuchos::as<LocalOrdinal> (nDofsPerNode);
71  Teuchos::ArrayView<const LocalOrdinal> indices;
72  Teuchos::ArrayView<const Scalar> vals;
73  Teuchos::SerialDenseMatrix<LocalOrdinal,Scalar> subBlockMatrix(nDofsPerNode, nDofsPerNode, true);
74  std::vector<GlobalOrdinal> growIds(nDofsPerNode);
75 
76  // loop over local nodes
77  // TODO what about nOffset?
78  LocalOrdinal numLocalNodes = A->getRowMap()->getNodeNumElements()/nDofsPerNode;
79  for (LocalOrdinal node = 0; node < numLocalNodes; ++node) {
80 
81  // zero out block matrix
82  subBlockMatrix.putScalar();
83 
84  // loop over all DOFs in current node
85  // Note: were assuming constant number of Dofs per node here!
86  // TODO This is more complicated for variable dofs per node
87  for (LocalOrdinal lrdof = 0; lrdof < lonDofsPerNode; ++lrdof) {
88  GlobalOrdinal grow = getGlobalDofId(A, node, lrdof);
89  growIds[lrdof] = grow;
90 
91  // extract local row information from matrix
92  A->getLocalRowView(A->getRowMap()->getLocalElement(grow), indices, vals);
93 
94  // find column entry with max absolute value
95  Scalar maxVal = 0.0;
96  for (size_t j = 0; j < Teuchos::as<size_t>(indices.size()); j++) {
97  if(Teuchos::ScalarTraits<Scalar>::magnitude(vals[j]) > maxVal) {
98  maxVal = Teuchos::ScalarTraits<Scalar>::magnitude(vals[j]);
99  }
100  }
101 
102  GlobalOrdinal grnodeid = globalDofId2globalNodeId(A,grow);
103 
104  for (size_t j = 0; j < Teuchos::as<size_t>(indices.size()); j++) {
105  GlobalOrdinal gcol = A->getColMap()->getGlobalElement(indices[j]);
106  GlobalOrdinal gcnodeid = globalDofId2globalNodeId(A,gcol); // -> global node id
107  if (grnodeid == gcnodeid) {
108  if(maxVal != 0.0) {
109  subBlockMatrix(lrdof, gcol % nDofsPerNode) = vals[j]/maxVal;
110  } else
111  {
112  subBlockMatrix(lrdof, gcol % nDofsPerNode) = vals[j]; // there is a problem
113  std::cout << "maxVal never should be zero!!!!" << std::endl;
114  }
115  }
116  }
117  }
118 
119  // now we have the sub block matrix
120 
121  // build permutation string
122  /*std::stringstream ss;
123  for(size_t t = 0; t<nDofsPerNode; t++)
124  ss << t;
125  std::string cs = ss.str();
126  std::vector<std::string> result_perms;
127  do {
128  result_perms.push_back(cs);
129  //std::cout << result_perms.back() << std::endl;
130  } while (std::next_permutation(cs.begin(),cs.end()));*/
131 
132  std::vector<Scalar> performance_vector = std::vector<Scalar>(result_permvecs_.size());
133  for (size_t t = 0; t < result_permvecs_.size(); t++) {
134  std::vector<int> vv = result_permvecs_[t];
135  Scalar value = 1.0;
136  for(size_t j=0; j<vv.size(); j++) {
137  value = value * subBlockMatrix(j,vv[j]);
138  }
139  performance_vector[t] = value;
140  }
141  /*for(size_t t = 0; t < result_perms.size(); t++) {
142  std::string s = result_perms[t];
143  Scalar value = 1.0;
144  for(size_t len=0; len<s.length(); len++) {
145  int col = Teuchos::as<int>(s[len]-'0');
146  value = value * subBlockMatrix(len,col);
147  }
148  performance_vector[t] = value;
149  }*/
150 
151  // find permutation with maximum performance value
152  Scalar maxVal = 0.0;
153  size_t maxPerformancePermutationIdx = 0;
154  for (size_t j = 0; j < Teuchos::as<size_t>(performance_vector.size()); j++) {
155  if(Teuchos::ScalarTraits<Scalar>::magnitude(performance_vector[j]) > maxVal) {
156  maxVal = Teuchos::ScalarTraits<Scalar>::magnitude(performance_vector[j]);
157  maxPerformancePermutationIdx = j;
158  }
159  }
160 
161  // build RowColPairs for best permutation
162  std::vector<int> bestPerformancePermutation = result_permvecs_[maxPerformancePermutationIdx];
163  for(size_t t = 0; t<nDofsPerNode; t++) {
164  RowColPairs.push_back(std::make_pair(growIds[t],growIds[bestPerformancePermutation[t]]));
165  }
166 
167  } // end loop over local nodes
168 
169 
170  // build Pperm and Qperm vectors
171  Teuchos::RCP<Vector> Pperm = VectorFactory::Build(A->getRowMap());
172  Teuchos::RCP<Vector> Qperm = VectorFactory::Build(A->getDomainMap());
173 
174  Pperm->putScalar(0.0);
175  Qperm->putScalar(0.0);
176 
177  Teuchos::ArrayRCP<Scalar> PpermData = Pperm->getDataNonConst(0);
178  Teuchos::ArrayRCP<Scalar> QpermData = Qperm->getDataNonConst(0);
179 
180  typename std::vector<std::pair<GlobalOrdinal, GlobalOrdinal> >::iterator p = RowColPairs.begin();
181  while(p != RowColPairs.end() ) {
182  GlobalOrdinal ik = (*p).first;
183  GlobalOrdinal jk = (*p).second;
184 
185  LocalOrdinal lik = A->getRowMap()->getLocalElement(ik);
186  LocalOrdinal ljk = A->getDomainMap()->getLocalElement(jk);
187 
188  Pperm->replaceLocalValue(lik,ik);
189  Qperm->replaceLocalValue(ljk,ik);
190 
191  p = RowColPairs.erase(p);
192  }
193 
194  if(RowColPairs.size()>0) GetOStream(Warnings0) << "MueLu::LocalPermutationStrategy: There are Row/col pairs left!" << std::endl;
195 
196  // Qperm should be fine
197  // build matrices
198 
199  // create new empty Matrix
200  Teuchos::RCP<CrsMatrixWrap> permPTmatrix = Teuchos::rcp(new CrsMatrixWrap(A->getRowMap(),1,Xpetra::StaticProfile));
201  Teuchos::RCP<CrsMatrixWrap> permQTmatrix = Teuchos::rcp(new CrsMatrixWrap(A->getRowMap(),1,Xpetra::StaticProfile));
202 
203  for(size_t row=0; row<A->getNodeNumRows(); row++) {
204  Teuchos::ArrayRCP<GlobalOrdinal> indoutP(1,Teuchos::as<GO>(PpermData[row])); // column idx for Perm^T
205  Teuchos::ArrayRCP<GlobalOrdinal> indoutQ(1,Teuchos::as<GO>(QpermData[row])); // column idx for Qperm
206  Teuchos::ArrayRCP<Scalar> valout(1,1.0);
207  permPTmatrix->insertGlobalValues(A->getRowMap()->getGlobalElement(row), indoutP.view(0,indoutP.size()), valout.view(0,valout.size()));
208  permQTmatrix->insertGlobalValues (A->getRowMap()->getGlobalElement(row), indoutQ.view(0,indoutQ.size()), valout.view(0,valout.size()));
209  }
210 
211  permPTmatrix->fillComplete();
212  permQTmatrix->fillComplete();
213 
214  Teuchos::RCP<Matrix> permPmatrix = Utils2::Transpose(*permPTmatrix,true);
215 
216  /*for(size_t row=0; row<permPTmatrix->getNodeNumRows(); row++) {
217  if(permPTmatrix->getNumEntriesInLocalRow(row) != 1)
218  GetOStream(Warnings0) <<"#entries in row " << row << " of permPTmatrix is " << permPTmatrix->getNumEntriesInLocalRow(row) << std::endl;
219  if(permPmatrix->getNumEntriesInLocalRow(row) != 1)
220  GetOStream(Warnings0) <<"#entries in row " << row << " of permPmatrix is " << permPmatrix->getNumEntriesInLocalRow(row) << std::endl;
221  if(permQTmatrix->getNumEntriesInLocalRow(row) != 1)
222  GetOStream(Warnings0) <<"#entries in row " << row << " of permQmatrix is " << permQTmatrix->getNumEntriesInLocalRow(row) << std::endl;
223  }*/
224 
225  // build permP * A * permQT
226  Teuchos::RCP<Matrix> ApermQt = Xpetra::MatrixMatrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Multiply(*A, false, *permQTmatrix, false, GetOStream(Statistics2),true,true);
227  Teuchos::RCP<Matrix> permPApermQt = Xpetra::MatrixMatrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Multiply(*permPmatrix, false, *ApermQt, false, GetOStream(Statistics2),true,true);
228 
229  /*
230  MueLu::Utils<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Write("A.mat", *A);
231  MueLu::Utils<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Write("permP.mat", *permPmatrix);
232  MueLu::Utils<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Write("permQt.mat", *permQTmatrix);
233  MueLu::Utils<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Write("permPApermQt.mat", *permPApermQt);
234  */
235  // build scaling matrix
236  Teuchos::RCP<Vector> diagVec = VectorFactory::Build(permPApermQt->getRowMap(),true);
237  Teuchos::RCP<Vector> invDiagVec = VectorFactory::Build(permPApermQt->getRowMap(),true);
238  Teuchos::ArrayRCP< const Scalar > diagVecData = diagVec->getData(0);
239  Teuchos::ArrayRCP< Scalar > invDiagVecData = invDiagVec->getDataNonConst(0);
240 
241  LO lCntZeroDiagonals = 0;
242  permPApermQt->getLocalDiagCopy(*diagVec);
243  for(size_t i = 0; i<diagVec->getMap()->getNodeNumElements(); ++i) {
244  if(diagVecData[i] != 0.0)
245  invDiagVecData[i] = 1/diagVecData[i];
246  else {
247  invDiagVecData[i] = 1.0;
248  lCntZeroDiagonals++;
249  //GetOStream(Statistics0) << "MueLu::LocalPermutationStrategy: found zero on diagonal in row " << i << std::endl;
250  }
251  }
252 
253 #if 0
254  GO gCntZeroDiagonals = 0;
255  GO glCntZeroDiagonals = Teuchos::as<GlobalOrdinal>(lCntZeroDiagonals); /* LO->GO conversion */
256  MueLu_sumAll(comm,glCntZeroDiagonals,gCntZeroDiagonals);
257  GetOStream(Statistics0) << "MueLu::LocalPermutationStrategy: found " << gCntZeroDiagonals << " zeros on diagonal" << std::endl;
258 #endif
259 
260  Teuchos::RCP<CrsMatrixWrap> diagScalingOp = Teuchos::rcp(new CrsMatrixWrap(permPApermQt->getRowMap(),1,Xpetra::StaticProfile));
261 
262  for(size_t row=0; row<A->getNodeNumRows(); row++) {
263  Teuchos::ArrayRCP<GlobalOrdinal> indout(1,permPApermQt->getRowMap()->getGlobalElement(row)); // column idx for Perm^T
264  Teuchos::ArrayRCP<Scalar> valout(1,invDiagVecData[row]);
265  diagScalingOp->insertGlobalValues(A->getRowMap()->getGlobalElement(row), indout.view(0,indout.size()), valout.view(0,valout.size()));
266  }
267  diagScalingOp->fillComplete();
268 
269  Teuchos::RCP<Matrix> scaledA = Xpetra::MatrixMatrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Multiply(*diagScalingOp, false, *permPApermQt, false, GetOStream(Statistics2), true, true);
270  currentLevel.Set("A", Teuchos::rcp_dynamic_cast<Matrix>(scaledA), genFactory);
271 
272  currentLevel.Set("permA", Teuchos::rcp_dynamic_cast<Matrix>(permPApermQt), genFactory);
273  currentLevel.Set("permP", Teuchos::rcp_dynamic_cast<Matrix>(permPmatrix), genFactory);
274  currentLevel.Set("permQT", Teuchos::rcp_dynamic_cast<Matrix>(permQTmatrix), genFactory);
275  currentLevel.Set("permScaling", Teuchos::rcp_dynamic_cast<Matrix>(diagScalingOp), genFactory);
276 
278  // count zeros on diagonal in P -> number of row permutations
279  Teuchos::RCP<Vector> diagPVec = VectorFactory::Build(permPmatrix->getRowMap(),true);
280  permPmatrix->getLocalDiagCopy(*diagPVec);
281  Teuchos::ArrayRCP< const Scalar > diagPVecData = diagPVec->getData(0);
282  GlobalOrdinal lNumRowPermutations = 0;
283  GlobalOrdinal gNumRowPermutations = 0;
284  for(size_t i = 0; i<diagPVec->getMap()->getNodeNumElements(); ++i) {
285  if(diagPVecData[i] == 0.0) {
286  lNumRowPermutations++;
287  }
288  }
289 
290  // sum up all entries in multipleColRequests over all processors
291  MueLu_sumAll(diagPVec->getMap()->getComm(), lNumRowPermutations, gNumRowPermutations);
292 
294  // count zeros on diagonal in Q^T -> number of column permutations
295  Teuchos::RCP<Vector> diagQTVec = VectorFactory::Build(permQTmatrix->getRowMap(),true);
296  permQTmatrix->getLocalDiagCopy(*diagQTVec);
297  Teuchos::ArrayRCP< const Scalar > diagQTVecData = diagQTVec->getData(0);
298  GlobalOrdinal lNumColPermutations = 0;
299  GlobalOrdinal gNumColPermutations = 0;
300  for(size_t i = 0; i<diagQTVec->getMap()->getNodeNumElements(); ++i) {
301  if(diagQTVecData[i] == 0.0) {
302  lNumColPermutations++;
303  }
304  }
305 
306  // sum up all entries in multipleColRequests over all processors
307  MueLu_sumAll(diagQTVec->getMap()->getComm(), lNumColPermutations, gNumColPermutations);
308 
309  currentLevel.Set("#RowPermutations", gNumRowPermutations, genFactory/*this*/);
310  currentLevel.Set("#ColPermutations", gNumColPermutations, genFactory/*this*/);
311  currentLevel.Set("#WideRangeRowPermutations", 0, genFactory/*this*/);
312  currentLevel.Set("#WideRangeColPermutations", 0, genFactory/*this*/);
313 
314  GetOStream(Statistics0) << "#Row permutations/max possible permutations: " << gNumRowPermutations << "/" << diagPVec->getMap()->getGlobalNumElements() << std::endl;
315  GetOStream(Statistics0) << "#Column permutations/max possible permutations: " << gNumColPermutations << "/" << diagQTVec->getMap()->getGlobalNumElements() << std::endl;
316 
317 #endif // #ifndef HAVE_MUELU_INST_COMPLEX_INT_INT
318  }
319 
320  template<class Scalar, class LocalOrdinal, class GlobalOrdinal, class Node>
321  GlobalOrdinal LocalPermutationStrategy<Scalar, LocalOrdinal, GlobalOrdinal, Node>::getGlobalDofId(const Teuchos::RCP<Matrix> & A, LocalOrdinal localNodeId, LocalOrdinal localDof) const {
322  size_t nDofsPerNode = 1;
323  if (A->IsView("stridedMaps")) {
324  Teuchos::RCP<const Map> permRowMapStrided = A->getRowMap("stridedMaps");
325  nDofsPerNode = Teuchos::rcp_dynamic_cast<const StridedMap>(permRowMapStrided)->getFixedBlockSize();
326  }
327 
328  LocalOrdinal localDofId = localNodeId * nDofsPerNode + localDof;
329 
330  return A->getRowMap()->getGlobalElement(localDofId);
331  }
332 
333  template<class Scalar, class LocalOrdinal, class GlobalOrdinal, class Node>
334  GlobalOrdinal LocalPermutationStrategy<Scalar, LocalOrdinal, GlobalOrdinal, Node>::globalDofId2globalNodeId( const Teuchos::RCP<Matrix> & A, GlobalOrdinal grid ) const {
335  size_t nDofsPerNode = 1;
336  if (A->IsView("stridedMaps")) {
337  Teuchos::RCP<const Map> permRowMapStrided = A->getRowMap("stridedMaps");
338  nDofsPerNode = Teuchos::rcp_dynamic_cast<const StridedMap>(permRowMapStrided)->getFixedBlockSize();
339  }
340 
341  return (GlobalOrdinal) grid / (GlobalOrdinal)nDofsPerNode; // TODO what about nOffset???
342  }
343 
344 } // namespace MueLu
345 
346 
347 #endif /* MUELU_LOCALPERMUTATIONSTRATEGY_DEF_HPP_ */
Important warning messages (one line)
static RCP< Matrix > Transpose(Matrix &Op, bool optimizeTranspose=false, const std::string &label=std::string())
Transpose a Xpetra::Matrix.
void BuildPermutation(const Teuchos::RCP< Matrix > &A, const Teuchos::RCP< const Map > permRowMap, Level &currentLevel, const FactoryBase *genFactory) const
build permutation operators
Namespace for MueLu classes and methods.
Print even more statistics.
GlobalOrdinal getGlobalDofId(const Teuchos::RCP< Matrix > &A, LocalOrdinal localNodeId, LocalOrdinal localDof) const
Base class for factories (e.g., R, P, and A_coarse).
Print statistics that do not involve significant additional computation.
#define MueLu_sumAll(rcpComm, in, out)
Class that holds all level-specific information.
Definition: MueLu_Level.hpp:99
void BuildPermutations(size_t nDofsPerNode) const
GlobalOrdinal globalDofId2globalNodeId(const Teuchos::RCP< Matrix > &A, GlobalOrdinal grid) const
void Set(const std::string &ename, const T &entry, const FactoryBase *factory=NoFactory::get())