MueLu Version of the Day
Loading...
Searching...
No Matches
MueLu_Zoltan2Interface_def.hpp
Go to the documentation of this file.
1// @HEADER
2//
3// ***********************************************************************
4//
5// MueLu: A package for multigrid based preconditioning
6// Copyright 2012 Sandia Corporation
7//
8// Under the terms of Contract DE-AC04-94AL85000 with Sandia Corporation,
9// the U.S. Government retains certain rights in this software.
10//
11// Redistribution and use in source and binary forms, with or without
12// modification, are permitted provided that the following conditions are
13// met:
14//
15// 1. Redistributions of source code must retain the above copyright
16// notice, this list of conditions and the following disclaimer.
17//
18// 2. Redistributions in binary form must reproduce the above copyright
19// notice, this list of conditions and the following disclaimer in the
20// documentation and/or other materials provided with the distribution.
21//
22// 3. Neither the name of the Corporation nor the names of the
23// contributors may be used to endorse or promote products derived from
24// this software without specific prior written permission.
25//
26// THIS SOFTWARE IS PROVIDED BY SANDIA CORPORATION "AS IS" AND ANY
27// EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
28// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
29// PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL SANDIA CORPORATION OR THE
30// CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
31// EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
32// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
33// PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
34// LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
35// NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
36// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
37//
38// Questions? Contact
39// Jonathan Hu (jhu@sandia.gov)
40// Andrey Prokopenko (aprokop@sandia.gov)
41// Ray Tuminaro (rstumin@sandia.gov)
42//
43// ***********************************************************************
44//
45// @HEADER
46#ifndef MUELU_ZOLTAN2INTERFACE_DEF_HPP
47#define MUELU_ZOLTAN2INTERFACE_DEF_HPP
48
49#include <sstream>
50#include <set>
51
53#if defined(HAVE_MUELU_ZOLTAN2) && defined(HAVE_MPI)
54
55#include <Zoltan2_XpetraMultiVectorAdapter.hpp>
56#include <Zoltan2_XpetraCrsGraphAdapter.hpp>
57#include <Zoltan2_PartitioningProblem.hpp>
58
59#include <Teuchos_Utils.hpp>
60#include <Teuchos_DefaultMpiComm.hpp>
61#include <Teuchos_OpaqueWrapper.hpp>
62
63#include "MueLu_Level.hpp"
64#include "MueLu_Exceptions.hpp"
65#include "MueLu_Monitor.hpp"
66
67namespace MueLu {
68
// Populates defaultZoltan2Params with the defaults used when the caller does
// not override them: algorithm "multijagged", partitioning approach
// "partition", and MultiJagged premigration option 1.
// NOTE(review): the signature line (listing line 70) is missing from this
// extract; presumably this is the Zoltan2Interface constructor - confirm.
69 template <class Scalar, class LocalOrdinal, class GlobalOrdinal, class Node>
71 defaultZoltan2Params = rcp(new ParameterList());
72 defaultZoltan2Params->set("algorithm", "multijagged");
73 defaultZoltan2Params->set("partitioning_approach", "partition");
74
75 // Improve scaling for communication-bound algorithms by premigrating
76 // coordinates to a subset of processors.
77 // For more information, see GitHub issue #1538.
78 defaultZoltan2Params->set("mj_premigration_option", 1);
79 }
80
// Builds and returns the list of parameters this factory accepts. Every entry
// defaults to Teuchos::null: the generating factories for "A",
// "number of partitions", "Coordinates" and
// "repartition: heuristic target rows per process", plus an optional
// "ParameterList" holding user-supplied Zoltan2 parameters.
// NOTE(review): the signature line (listing line 82) is missing from this
// extract; presumably GetValidParameterList() const - confirm.
81 template <class Scalar, class LocalOrdinal, class GlobalOrdinal, class Node>
83 RCP<ParameterList> validParamList = rcp(new ParameterList());
84
85 validParamList->set< RCP<const FactoryBase> > ("A", Teuchos::null, "Factory of the matrix A");
86 validParamList->set< RCP<const FactoryBase> > ("number of partitions", Teuchos::null, "Instance of RepartitionHeuristicFactory.");
87 validParamList->set< RCP<const FactoryBase> > ("Coordinates", Teuchos::null, "Factory of the coordinates");
88 validParamList->set< RCP<const ParameterList> > ("ParameterList", Teuchos::null, "Zoltan2 parameters");
89 validParamList->set< RCP<const FactoryBase> > ("repartition: heuristic target rows per process", Teuchos::null, "Factory for number of rows per process to use with MultiJagged");
90
91 return validParamList;
92 }
93
94
// Declares the level data this factory needs. "A" and "number of partitions"
// are always requested; "Coordinates" and
// "repartition: heuristic target rows per process" are requested depending on
// the "algorithm" entry of the user-supplied Zoltan2 "ParameterList".
// NOTE(review): the signature line (listing line 96) is missing from this
// extract; presumably DeclareInput(Level& currentLevel) const - confirm.
95 template <class Scalar, class LocalOrdinal, class GlobalOrdinal, class Node>
97 Input(currentLevel, "A");
98 Input(currentLevel, "number of partitions");
99 const ParameterList& pL = GetParameterList();
100 // We do this dance because we don't want "ParameterList" to be marked as used.
101 // Is there a better way?
102 Teuchos::ParameterEntry entry = pL.getEntry("ParameterList");
103 RCP<const Teuchos::ParameterList> providedList = Teuchos::any_cast<RCP<const Teuchos::ParameterList> >(entry.getAny(false));
// A user list that names a string "algorithm" decides which extra inputs are requested.
104 if (providedList != Teuchos::null && providedList->isType<std::string>("algorithm")) {
105 const std::string algo = providedList->get<std::string>("algorithm");
106 if (algo == "multijagged") {
107 Input(currentLevel, "Coordinates");
108 Input(currentLevel, "repartition: heuristic target rows per process");
109 } else if (algo == "rcb") {
110 Input(currentLevel, "Coordinates");
111 }
// Any other algorithm name requests nothing beyond "A" and "number of partitions".
112 } else {
// No user list, or no string "algorithm" entry in it: request both extra inputs.
113 Input(currentLevel, "repartition: heuristic target rows per process");
114 Input(currentLevel, "Coordinates");
115 }
116 }
117
// Computes the "Partition" vector for this level with Zoltan2 and stores it on
// the level via Set(level, "Partition", ...).
//
// Flow:
//  - If "number of partitions" is 1 or -1, a zero-filled vector over A's row
//    map is stored and the function returns.
//  - Otherwise the user "ParameterList" is merged with defaultZoltan2Params
//    (user entries win) and "num_global_parts" is set to the requested count.
//  - For "multijagged" and "rcb" the partitioner runs on the coordinates,
//    weighted by the number of local matrix entries per block row; every row
//    of a block receives the part of its coordinate.
//  - For any other algorithm the partitioner runs on A's CRS graph; for
//    blkSize > 1 the part of the first row of each block is used for the
//    whole block.
//
// Throws Exceptions::Incompatible when the local coordinate count differs from
// the local number of block rows of A. The cast of the duplicated communicator
// to Teuchos::MpiComm is made with throw_on_fail = true, so a non-MPI
// communicator raises an exception instead of leaving a null pointer that is
// dereferenced on the next line.
// NOTE(review): the signature line (listing line 119) is missing from this
// extract; presumably Build(Level& level) const - confirm.
118 template <class Scalar, class LocalOrdinal, class GlobalOrdinal, class Node>
120 FactoryMonitor m(*this, "Build", level);
121
122 typedef typename Teuchos::ScalarTraits<SC>::coordinateType real_type;
123 typedef typename Xpetra::MultiVector<real_type,LO,GO,NO> RealValuedMultiVector;
124
125 RCP<Matrix> A = Get<RCP<Matrix> >(level, "A");
126 RCP<const Map> rowMap = A->getRowMap();
127 LO blkSize = A->GetFixedBlockSize();
128
129 int numParts = Get<int>(level, "number of partitions");
130 if (numParts == 1 || numParts == -1) {
131 // One partition requested (or numParts == -1): decomposition is trivial, all zeros
132 RCP<Xpetra::Vector<GO,LO,GO,NO> > decomposition = Xpetra::VectorFactory<GO, LO, GO, NO>::Build(rowMap, true);
133 Set(level, "Partition", decomposition);
134 return;
135 }/* else if (numParts == -1) {
136 // No repartitioning
137 RCP<Xpetra::Vector<GO,LO,GO,NO> > decomposition = Teuchos::null; //Xpetra::VectorFactory<GO, LO, GO, NO>::Build(rowMap, true);
138 //decomposition->putScalar(Teuchos::as<Scalar>(rowMap->getComm()->getRank()));
139 Set(level, "Partition", decomposition);
140 return;
141 }*/
142
143 const ParameterList& pL = GetParameterList();
144
145 RCP<const ParameterList> providedList = pL.get<RCP<const ParameterList> >("ParameterList");
146 ParameterList Zoltan2Params;
147 if (providedList != Teuchos::null)
148 Zoltan2Params = *providedList;
149
150 // Merge default Zoltan2 parameters with the user-provided ones.
151 // If default and user parameters contain the same parameter name, the user one is always preferred.
152 for (ParameterList::ConstIterator param = defaultZoltan2Params->begin(); param != defaultZoltan2Params->end(); param++) {
153 const std::string& pName = defaultZoltan2Params->name(param);
154 if (!Zoltan2Params.isParameter(pName))
155 Zoltan2Params.setEntry(pName, defaultZoltan2Params->getEntry(pName));
156 }
157 Zoltan2Params.set("num_global_parts", Teuchos::as<int>(numParts));
158
159 GetOStream(Runtime0) << "Zoltan2 parameters:\n----------\n" << Zoltan2Params << "----------" << std::endl;
160
161 const std::string& algo = Zoltan2Params.get<std::string>("algorithm");
162
163 if (algo == "multijagged" || algo == "rcb") {
164
165 RCP<RealValuedMultiVector> coords = Get<RCP<RealValuedMultiVector> >(level, "Coordinates");
166 RCP<const Map> map = coords->getMap();
167 GO numElements = map->getLocalNumElements();
168
169 // Check that the number of local coordinates is consistent with the #rows in A
170 TEUCHOS_TEST_FOR_EXCEPTION(rowMap->getLocalNumElements()/blkSize != coords->getLocalLength(), Exceptions::Incompatible,
171 "Coordinate vector length (" + toString(coords->getLocalLength()) + ") is incompatible with number of block rows in A ("
172 + toString(rowMap->getLocalNumElements()/blkSize) + "). The vector length should be the same as the number of mesh points.");
173#ifdef HAVE_MUELU_DEBUG
174 GO indexBase = rowMap->getIndexBase();
175 GetOStream(Runtime0) << "Checking consistence of row and coordinates maps" << std::endl;
176 // Make sure that logical blocks in row map coincide with logical nodes in coordinates map
177 ArrayView<const GO> rowElements = rowMap->getLocalElementList();
178 ArrayView<const GO> coordsElements = map ->getLocalElementList();
179 for (LO i = 0; i < Teuchos::as<LO>(numElements); i++)
180 TEUCHOS_TEST_FOR_EXCEPTION((coordsElements[i]-indexBase)*blkSize + indexBase != rowElements[i*blkSize],
181 Exceptions::RuntimeError, "i = " << i << ", coords GID = " << coordsElements[i]
182 << ", row GID = " << rowElements[i*blkSize] << ", blkSize = " << blkSize << std::endl);
183#endif
184
185 typedef Zoltan2::XpetraMultiVectorAdapter<RealValuedMultiVector> InputAdapterType;
186 typedef Zoltan2::PartitioningProblem<InputAdapterType> ProblemType;
187
// Weight of a coordinate = total number of local matrix entries in its block of rows.
188 Array<real_type> weightsPerRow(numElements);
189 for (LO i = 0; i < numElements; i++) {
190 weightsPerRow[i] = 0.0;
191
192 for (LO j = 0; j < blkSize; j++) {
193 weightsPerRow[i] += A->getNumEntriesInLocalRow(i*blkSize+j);
194 }
195 }
196
197 // MultiJagged: Grab the target rows per process from the Heuristic to use unless the Zoltan2 list says otherwise
198 if(algo == "multijagged" && !Zoltan2Params.isParameter("mj_premigration_coordinate_count")) {
199 LO heuristicTargetRowsPerProcess = Get<LO>(level,"repartition: heuristic target rows per process");
200 Zoltan2Params.set("mj_premigration_coordinate_count", heuristicTargetRowsPerProcess);
201 }
// "mj_debug" is read here and removed before the list is handed to Zoltan2.
202 const bool writeZoltan2DebuggingFiles = Zoltan2Params.get("mj_debug",false);
203 Zoltan2Params.remove("mj_debug");
204
205 std::vector<int> strides;
206 std::vector<const real_type*> weights(1, weightsPerRow.getRawPtr());
207
// throw_on_fail = true: a communicator that is not a Teuchos::MpiComm raises an exception instead of yielding a null RCP.
208 RCP<const Teuchos::MpiComm<int> > dupMpiComm = rcp_dynamic_cast<const Teuchos::MpiComm<int> >(rowMap->getComm()->duplicate(), true);
209 RCP<const Teuchos::OpaqueWrapper<MPI_Comm> > zoltanComm = dupMpiComm->getRawMpiComm();
210
211 InputAdapterType adapter(coords, weights, strides);
212 RCP<ProblemType> problem(new ProblemType(&adapter, &Zoltan2Params, (*zoltanComm)()));
213
214 {
215 SubFactoryMonitor m1(*this, "Zoltan2 " + toString(algo), level);
216 if (writeZoltan2DebuggingFiles)
217 adapter.generateFiles(("mj_debug.lvl_"+std::to_string(level.GetLevelID())).c_str(), *(rowMap->getComm()));
218 problem->solve();
219 }
220
221 RCP<Xpetra::Vector<GO,LO,GO,NO> > decomposition = Xpetra::VectorFactory<GO,LO,GO,NO>::Build(rowMap, false);
222 ArrayRCP<GO> decompEntries = decomposition->getDataNonConst(0);
223
224 const typename InputAdapterType::part_t * parts = problem->getSolution().getPartListView();
225
// Every row of a block gets the part assigned to the block's coordinate.
226 for (GO i = 0; i < numElements; i++) {
227 int partNum = parts[i];
228
229 for (LO j = 0; j < blkSize; j++)
230 decompEntries[i*blkSize + j] = partNum;
231 }
232
233 Set(level, "Partition", decomposition);
234
235 } else {
236
237 GO numElements = rowMap->getLocalNumElements();
238
239 typedef Zoltan2::XpetraCrsGraphAdapter<CrsGraph> InputAdapterType;
240 typedef Zoltan2::PartitioningProblem<InputAdapterType> ProblemType;
241
// throw_on_fail = true: a communicator that is not a Teuchos::MpiComm raises an exception instead of yielding a null RCP.
242 RCP<const Teuchos::MpiComm<int> > dupMpiComm = rcp_dynamic_cast<const Teuchos::MpiComm<int> >(rowMap->getComm()->duplicate(), true);
243 RCP<const Teuchos::OpaqueWrapper<MPI_Comm> > zoltanComm = dupMpiComm->getRawMpiComm();
244
245 InputAdapterType adapter(A->getCrsGraph());
246 RCP<ProblemType> problem(new ProblemType(&adapter, &Zoltan2Params, (*zoltanComm)()));
247
248 {
249 SubFactoryMonitor m1(*this, "Zoltan2 " + toString(algo), level);
250 problem->solve();
251 }
252
253 RCP<Xpetra::Vector<GO,LO,GO,NO> > decomposition = Xpetra::VectorFactory<GO,LO,GO,NO>::Build(rowMap, false);
254 ArrayRCP<GO> decompEntries = decomposition->getDataNonConst(0);
255
256 const typename InputAdapterType::part_t * parts = problem->getSolution().getPartListView();
257
258 // For blkSize > 1, ignore solution for every row but the first ones in a block.
259 for (GO i = 0; i < numElements/blkSize; i++) {
260 int partNum = parts[i*blkSize];
261
262 for (LO j = 0; j < blkSize; j++)
263 decompEntries[i*blkSize + j] = partNum;
264 }
265
266 Set(level, "Partition", decomposition);
267 }
268 }
269
270} //namespace MueLu
271
272#endif //if defined(HAVE_MUELU_ZOLTAN2) && defined(HAVE_MPI)
273
274#endif // MUELU_ZOLTAN2INTERFACE_DEF_HPP
Exception thrown to report incompatible objects (like maps).
Exception thrown to report errors in the internal logic of the program.
Timer to be used in factories. Similar to Monitor but with additional timers.
void Input(Level &level, const std::string &varName) const
T Get(Level &level, const std::string &varName) const
void Set(Level &level, const std::string &varName, const T &data) const
Class that holds all level-specific information.
virtual const Teuchos::ParameterList & GetParameterList() const
Timer to be used in factories. Similar to SubMonitor but adds a timer level by level.
Teuchos::FancyOStream & GetOStream(MsgType type, int thisProcRankOnly=0) const
Get an output stream for outputting the input message type.
void DeclareInput(Level &currentLevel) const
Specifies the data that this class needs, and the factories that generate that data.
RCP< const ParameterList > GetValidParameterList() const
Return a const parameter list of valid parameters that setParameterList() will accept.
void Build(Level &currentLevel) const
Build an object with this factory.
Namespace for MueLu classes and methods.
@ Runtime0
One-liner description of what is happening.
std::string toString(const T &what)
Little helper function to convert non-string types to strings.