MueLu  Version of the Day
MueLu_UncoupledAggregationFactory_kokkos_def.hpp
Go to the documentation of this file.
1 // @HEADER
2 //
3 // ***********************************************************************
4 //
5 // MueLu: A package for multigrid based preconditioning
6 // Copyright 2012 Sandia Corporation
7 //
8 // Under the terms of Contract DE-AC04-94AL85000 with Sandia Corporation,
9 // the U.S. Government retains certain rights in this software.
10 //
11 // Redistribution and use in source and binary forms, with or without
12 // modification, are permitted provided that the following conditions are
13 // met:
14 //
15 // 1. Redistributions of source code must retain the above copyright
16 // notice, this list of conditions and the following disclaimer.
17 //
18 // 2. Redistributions in binary form must reproduce the above copyright
19 // notice, this list of conditions and the following disclaimer in the
20 // documentation and/or other materials provided with the distribution.
21 //
22 // 3. Neither the name of the Corporation nor the names of the
23 // contributors may be used to endorse or promote products derived from
24 // this software without specific prior written permission.
25 //
26 // THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY
27 // EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
28 // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
29 // PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE
30 // CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
31 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
32 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
33 // PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
34 // LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
35 // NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
36 // SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
37 //
38 // Questions? Contact
39 // Jonathan Hu (jhu@sandia.gov)
40 // Andrey Prokopenko (aprokop@sandia.gov)
41 // Ray Tuminaro (rstumin@sandia.gov)
42 //
43 // ***********************************************************************
44 //
45 // @HEADER
46 #ifndef MUELU_UNCOUPLEDAGGREGATIONFACTORY_KOKKOS_DEF_HPP_
47 #define MUELU_UNCOUPLEDAGGREGATIONFACTORY_KOKKOS_DEF_HPP_
48 
49 #ifdef HAVE_MUELU_KOKKOS_REFACTOR
50 
51 #include <climits>
52 
53 #include <Xpetra_Map.hpp>
54 #include <Xpetra_Vector.hpp>
55 #include <Xpetra_MultiVectorFactory.hpp>
56 #include <Xpetra_VectorFactory.hpp>
57 
59 
60 #include "MueLu_OnePtAggregationAlgorithm_kokkos.hpp"
61 #include "MueLu_PreserveDirichletAggregationAlgorithm_kokkos.hpp"
62 #include "MueLu_IsolatedNodeAggregationAlgorithm_kokkos.hpp"
63 
64 #include "MueLu_AggregationPhase1Algorithm_kokkos.hpp"
65 #include "MueLu_AggregationPhase2aAlgorithm_kokkos.hpp"
66 #include "MueLu_AggregationPhase2bAlgorithm_kokkos.hpp"
67 #include "MueLu_AggregationPhase3Algorithm_kokkos.hpp"
68 
69 #include "MueLu_Level.hpp"
70 #include "MueLu_LWGraph_kokkos.hpp"
71 #include "MueLu_Aggregates_kokkos.hpp"
72 #include "MueLu_MasterList.hpp"
73 #include "MueLu_Monitor.hpp"
74 #include "MueLu_AmalgamationInfo.hpp"
75 #include "MueLu_Utilities.hpp" // for sum_all and similar stuff...
76 
77 namespace MueLu {
78 
79  template <class LocalOrdinal, class GlobalOrdinal, class Node>
80  UncoupledAggregationFactory_kokkos<LocalOrdinal, GlobalOrdinal, Node>::UncoupledAggregationFactory_kokkos()
81  : bDefinitionPhase_(true)
82  { }
83 
84  template <class LocalOrdinal, class GlobalOrdinal, class Node>
85  RCP<const ParameterList> UncoupledAggregationFactory_kokkos<LocalOrdinal, GlobalOrdinal, Node>::GetValidParameterList() const {
86  RCP<ParameterList> validParamList = rcp(new ParameterList());
87 
88  // Aggregation parameters (used in aggregation algorithms)
89  // TODO introduce local member function for each aggregation algorithm such that each aggregation algorithm can define its own parameters
90 
91  typedef Teuchos::StringToIntegralParameterEntryValidator<int> validatorType;
92 #define SET_VALID_ENTRY(name) validParamList->setEntry(name, MasterList::getEntry(name))
93  SET_VALID_ENTRY("aggregation: max agg size");
94  SET_VALID_ENTRY("aggregation: min agg size");
95  SET_VALID_ENTRY("aggregation: max selected neighbors");
96  SET_VALID_ENTRY("aggregation: ordering");
97  validParamList->getEntry("aggregation: ordering").setValidator(
98  rcp(new validatorType(Teuchos::tuple<std::string>("natural", "graph", "random"), "aggregation: ordering")));
99  SET_VALID_ENTRY("aggregation: enable phase 1");
100  SET_VALID_ENTRY("aggregation: enable phase 2a");
101  SET_VALID_ENTRY("aggregation: enable phase 2b");
102  SET_VALID_ENTRY("aggregation: enable phase 3");
103  SET_VALID_ENTRY("aggregation: preserve Dirichlet points");
104  SET_VALID_ENTRY("aggregation: allow user-specified singletons");
105 #undef SET_VALID_ENTRY
106 
107  // general variables needed in AggregationFactory
108  validParamList->set< RCP<const FactoryBase> >("Graph", null, "Generating factory of the graph");
109  validParamList->set< RCP<const FactoryBase> >("DofsPerNode", null, "Generating factory for variable \'DofsPerNode\', usually the same as for \'Graph\'");
110 
111  // special variables necessary for OnePtAggregationAlgorithm
112  validParamList->set< std::string > ("OnePt aggregate map name", "", "Name of input map for single node aggregates. (default='')");
113  validParamList->set< std::string > ("OnePt aggregate map factory", "", "Generating factory of (DOF) map for single node aggregates.");
114  //validParamList->set< RCP<const FactoryBase> >("OnePt aggregate map factory", NoFactory::getRCP(), "Generating factory of (DOF) map for single node aggregates.");
115 
116  return validParamList;
117  }
118 
119  template <class LocalOrdinal, class GlobalOrdinal, class Node>
120  void UncoupledAggregationFactory_kokkos<LocalOrdinal, GlobalOrdinal, Node>::DeclareInput(Level& currentLevel) const {
121  Input(currentLevel, "Graph");
122  Input(currentLevel, "DofsPerNode");
123 
124  const ParameterList& pL = GetParameterList();
125 
126  // request special data necessary for OnePtAggregationAlgorithm
127  std::string mapOnePtName = pL.get<std::string>("OnePt aggregate map name");
128  if (mapOnePtName.length() > 0) {
129  std::string mapOnePtFactName = pL.get<std::string>("OnePt aggregate map factory");
130  if (mapOnePtFactName == "" || mapOnePtFactName == "NoFactory") {
131  currentLevel.DeclareInput(mapOnePtName, NoFactory::get());
132  } else {
133  RCP<const FactoryBase> mapOnePtFact = GetFactory(mapOnePtFactName);
134  currentLevel.DeclareInput(mapOnePtName, mapOnePtFact.get());
135  }
136  }
137  }
138 
139  template <class LocalOrdinal, class GlobalOrdinal, class Node>
140  void UncoupledAggregationFactory_kokkos<LocalOrdinal, GlobalOrdinal, Node>::Build(Level &currentLevel) const {
141  FactoryMonitor m(*this, "Build", currentLevel);
142 
143  ParameterList pL = GetParameterList();
144  bDefinitionPhase_ = false; // definition phase is finished, now all aggregation algorithm information is fixed
145 
146  if (pL.get<int>("aggregation: max agg size") == -1)
147  pL.set("aggregation: max agg size", INT_MAX);
148 
149  // define aggregation algorithms
150  RCP<const FactoryBase> graphFact = GetFactory("Graph");
151 
152  // TODO Can we keep different aggregation algorithms over more Build calls?
153  algos_.clear();
154  algos_.push_back(rcp(new PreserveDirichletAggregationAlgorithm_kokkos(graphFact)));
155  if (pL.get<bool>("aggregation: allow user-specified singletons") == true) algos_.push_back(rcp(new OnePtAggregationAlgorithm_kokkos (graphFact)));
156  if (pL.get<bool>("aggregation: enable phase 1" ) == true) algos_.push_back(rcp(new AggregationPhase1Algorithm_kokkos (graphFact)));
157  if (pL.get<bool>("aggregation: enable phase 2a") == true) algos_.push_back(rcp(new AggregationPhase2aAlgorithm_kokkos (graphFact)));
158  if (pL.get<bool>("aggregation: enable phase 2b") == true) algos_.push_back(rcp(new AggregationPhase2bAlgorithm_kokkos (graphFact)));
159  if (pL.get<bool>("aggregation: enable phase 3" ) == true) algos_.push_back(rcp(new AggregationPhase3Algorithm_kokkos (graphFact)));
160 
161  std::string mapOnePtName = pL.get<std::string>("OnePt aggregate map name");
162  RCP<Map> OnePtMap = Teuchos::null;
163  if (mapOnePtName.length()) {
164  std::string mapOnePtFactName = pL.get<std::string>("OnePt aggregate map factory");
165  if (mapOnePtFactName == "" || mapOnePtFactName == "NoFactory") {
166  OnePtMap = currentLevel.Get<RCP<Map> >(mapOnePtName, NoFactory::get());
167  } else {
168  RCP<const FactoryBase> mapOnePtFact = GetFactory(mapOnePtFactName);
169  OnePtMap = currentLevel.Get<RCP<Map> >(mapOnePtName, mapOnePtFact.get());
170  }
171  }
172 
173  RCP<const LWGraph_kokkos> graph = Get< RCP<LWGraph_kokkos> >(currentLevel, "Graph");
174 
175  // Build
176  RCP<Aggregates_kokkos> aggregates = rcp(new Aggregates_kokkos(*graph));
177  aggregates->setObjectLabel("UC");
178 
179  const LO numRows = graph->GetNodeNumVertices();
180 
181  // construct aggStat information
182  std::vector<unsigned> aggStat(numRows, READY);
183 
184  // TODO
185  //ArrayRCP<const bool> dirichletBoundaryMap = graph->GetBoundaryNodeMap();
186  ArrayRCP<const bool> dirichletBoundaryMap;
187 
188  if (dirichletBoundaryMap != Teuchos::null)
189  for (LO i = 0; i < numRows; i++)
190  if (dirichletBoundaryMap[i] == true)
191  aggStat[i] = BOUNDARY;
192 
193  LO nDofsPerNode = Get<LO>(currentLevel, "DofsPerNode");
194  GO indexBase = graph->GetDomainMap()->getIndexBase();
195  if (OnePtMap != Teuchos::null) {
196  for (LO i = 0; i < numRows; i++) {
197  // reconstruct global row id (FIXME only works for contiguous maps)
198  GO grid = (graph->GetDomainMap()->getGlobalElement(i)-indexBase) * nDofsPerNode + indexBase;
199 
200  for (LO kr = 0; kr < nDofsPerNode; kr++)
201  if (OnePtMap->isNodeGlobalElement(grid + kr))
202  aggStat[i] = ONEPT;
203  }
204  }
205 
206 
207  const RCP<const Teuchos::Comm<int> > comm = graph->GetComm();
208  GO numGlobalRows = 0;
209  if (IsPrint(Statistics1))
210  MueLu_sumAll(comm, as<GO>(numRows), numGlobalRows);
211 
212  LO numNonAggregatedNodes = numRows;
213  GO numGlobalAggregatedPrev = 0, numGlobalAggsPrev = 0;
214  for (size_t a = 0; a < algos_.size(); a++) {
215  std::string phase = algos_[a]->description();
216  SubFactoryMonitor sfm(*this, "Algo \"" + phase + "\"", currentLevel);
217 
218  int oldRank = algos_[a]->SetProcRankVerbose(this->GetProcRankVerbose());
219  algos_[a]->BuildAggregates(pL, *graph, *aggregates, aggStat, numNonAggregatedNodes);
220  algos_[a]->SetProcRankVerbose(oldRank);
221 
222  if (IsPrint(Statistics1)) {
223  GO numLocalAggregated = numRows - numNonAggregatedNodes, numGlobalAggregated = 0;
224  GO numLocalAggs = aggregates->GetNumAggregates(), numGlobalAggs = 0;
225  MueLu_sumAll(comm, numLocalAggregated, numGlobalAggregated);
226  MueLu_sumAll(comm, numLocalAggs, numGlobalAggs);
227 
228  double aggPercent = 100*as<double>(numGlobalAggregated)/as<double>(numGlobalRows);
229  if (aggPercent > 99.99 && aggPercent < 100.00) {
230  // Due to round off (for instance, for 140465733/140466897), we could
231  // get 100.00% display even if there are some remaining nodes. This
232  // is bad from the users point of view. It is much better to change
233  // it to display 99.99%.
234  aggPercent = 99.99;
235  }
236  GetOStream(Statistics1) << " aggregated : " << (numGlobalAggregated - numGlobalAggregatedPrev) << " (phase), " << std::fixed
237  << std::setprecision(2) << numGlobalAggregated << "/" << numGlobalRows << " [" << aggPercent << "%] (total)\n"
238  << " remaining : " << numGlobalRows - numGlobalAggregated << "\n"
239  << " aggregates : " << numGlobalAggs-numGlobalAggsPrev << " (phase), " << numGlobalAggs << " (total)" << std::endl;
240  numGlobalAggregatedPrev = numGlobalAggregated;
241  numGlobalAggsPrev = numGlobalAggs;
242  }
243  }
244 
245  TEUCHOS_TEST_FOR_EXCEPTION(numNonAggregatedNodes, Exceptions::RuntimeError, "MueLu::UncoupledAggregationFactory::Build: Leftover nodes found! Error!");
246 
247  aggregates->AggregatesCrossProcessors(false);
248 
249  Set(currentLevel, "Aggregates", aggregates);
250 
251  GetOStream(Statistics1) << aggregates->description() << std::endl;
252  }
253 
254 } //namespace MueLu
255 
256 #endif // HAVE_MUELU_KOKKOS_REFACTOR
257 #endif /* MUELU_UNCOUPLEDAGGREGATIONFACTORY_KOKKOS_DEF_HPP_ */
#define MueLu_sumAll(rcpComm, in, out)
Print more statistics.
Namespace for MueLu classes and methods.
#define SET_VALID_ENTRY(name)