// symmetrize: combines the sparsity pattern of origGraph_ with that of a
// second graph, graphT, using the KokkosSparse spadd routines further down.
// NOTE(review): this text is a numbered listing with lines elided -- the
// leading integers are listing line numbers, and the declaration of graphT
// (presumably the transpose of origGraph_ -- confirm) as well as all closing
// braces are not visible. Comments describe only the statements shown.
// NOTE(review): "¶ms" on the parameter line looks like a mis-encoded
// "&params" (HTML entity damage) -- confirm against the original file.
222 symmetrize (
const Teuchos::RCP<Teuchos::ParameterList> ¶ms)
// Range policy over execution_space with size_t indices; used by the
// parallel_for launches later in this function.
227 using range_type = Kokkos::RangePolicy<execution_space, size_t>;
// Non-const view types for the row offsets and the (local) column indices
// of the local device graph.
230 using row_ptrs_array =
typename local_graph_device_type::row_map_type::non_const_type ;
231 using col_inds_array =
typename local_graph_device_type::entries_type::non_const_type;
// View of GlobalOrdinal on device_type; holds column indices after the
// local-to-global conversion below.
233 using global_col_inds_array =
typename Kokkos::View<GlobalOrdinal*, device_type>;
// Fetch the four maps of the original graph.
235 auto graph = origGraph_;
236 auto domain_map = graph->getDomainMap();
237 auto range_map = graph->getRangeMap();
238 auto row_map = graph->getRowMap();
239 auto col_map = graph->getColMap();
// Declared here, assigned further down (which assignment runs depends on
// matchingColMaps).
240 RCP<const map_type> col_map_sym;
241 RCP<const Import<LocalOrdinal,GlobalOrdinal,Node> > importer;
// Require that the domain map is the same as both the range map and the
// row map.
243 TEUCHOS_ASSERT(domain_map->isSameAs(*range_map));
244 TEUCHOS_ASSERT(domain_map->isSameAs(*row_map));
// graphT is defined on a line elided from this excerpt. Require that it has
// a column map and that its domain map matches the original graph's.
249 auto col_map_T = graphT->getColMap();
250 TEUCHOS_ASSERT(!col_map_T.is_null());
251 TEUCHOS_ASSERT(domain_map->isSameAs(*graphT->getDomainMap()));
// 'sorted' is true only when both graphs report isSorted().
// matchingColMaps records whether the two column maps are the same; it
// selects the code path below.
253 bool graphSorted = graph->isSorted();
254 bool graphTSorted = graphT->isSorted();
255 bool sorted = graphSorted && graphTSorted;
256 bool matchingColMaps = col_map->isSameAs(*col_map_T);
// Device-side local graphs of both inputs.
258 auto lclGraph = graph->getLocalGraphDevice();
259 auto lclGraphT = graphT->getLocalGraphDevice();
// Two KokkosKernels handle types that differ only in their second template
// argument (LocalOrdinal vs. GlobalOrdinal).
261 using KKH_LO = KokkosKernels::Experimental::KokkosKernelsHandle<size_t, LocalOrdinal,
impl_scalar_type,
262 typename Node::execution_space,
typename Node::memory_space,
typename Node::memory_space>;
263 using KKH_GO = KokkosKernels::Experimental::KokkosKernelsHandle<size_t, GlobalOrdinal,
impl_scalar_type,
264 typename Node::execution_space,
typename Node::memory_space,
typename Node::memory_space>;
// Row offsets and column indices of both local graphs.
266 auto rowptrs = lclGraph.row_map;
267 auto rowptrsT = lclGraphT.row_map;
268 auto colinds = lclGraph.entries;
269 auto colindsT = lclGraphT.entries;
// Row count is the length of the row-offset array minus one.
// NOTE(review): extent(0) is unsigned, so a zero-length rowptrs view would
// wrap around here -- confirm rowptrs always has at least one entry.
271 auto nrows = rowptrs.extent(0) - 1;
// Row offsets of the combined graph: nrows + 1 entries, allocated without
// initialization; passed to spadd_symbolic below as its last argument.
272 auto rowptrsSym = row_ptrs_array(Kokkos::ViewAllocateWithoutInitializing(
"row ptrs sym"), nrows + 1);
// Column indices of the combined graph; assigned in whichever path runs
// below.
274 col_inds_array colindsSym;
// Path taken when the two column maps are not the same: both sets of column
// indices are run through ConvertLocalToGlobalFunctor (each with its own
// graph's local column map) before being combined, and the combined indices
// are converted back with ConvertGlobalToLocalFunctor at the end.
// NOTE(review): listing lines are elided in this section (e.g. the
// declaration of 'handle' and the closing brace of this 'if').
276 if(!matchingColMaps) {
// Convert the original graph's column indices using its local column map.
278 auto lclColmap = col_map->getLocalMap();
279 global_col_inds_array colindsConverted(Kokkos::ViewAllocateWithoutInitializing(
"colinds (converted)"), colinds.extent(0));
280 ConvertLocalToGlobalFunctor<GlobalOrdinal, col_inds_array, global_col_inds_array, local_map_type> convert(colinds, colindsConverted, lclColmap);
281 Kokkos::parallel_for(
"colInds (converted)", range_type(0, colinds.extent(0)), convert);
// Same conversion for graphT, using graphT's local column map.
284 auto lclColmapT = col_map_T->getLocalMap();
285 global_col_inds_array colindsTConverted(Kokkos::ViewAllocateWithoutInitializing(
"colindsT (converted)"), colindsT.extent(0));
286 ConvertLocalToGlobalFunctor<GlobalOrdinal, col_inds_array, global_col_inds_array, local_map_type> convertT(colindsT, colindsTConverted, lclColmapT);
287 Kokkos::parallel_for(
"colIndsT (converted)", range_type(0, colindsT.extent(0)), convertT);
// The spadd handle is created with a literal 'false' here, whereas the other
// path passes 'sorted'. Presumably this marks the inputs as unsorted, which
// matches the unsorted numeric functor used below -- confirm against the
// KokkosKernels handle documentation.
291 handle.create_spadd_handle(
false);
292 auto addHandle = handle.get_spadd_handle();
// Combined column indices, still in converted (GlobalOrdinal) form.
294 global_col_inds_array globalColindsSym;
// Symbolic phase on the converted indices; afterwards the entry count of the
// result is read from the handle (get_c_nnz) to size globalColindsSym.
296 KokkosSparse::Experimental::spadd_symbolic
297 (&handle, rowptrs, colindsConverted, rowptrsT, colindsTConverted, rowptrsSym);
298 globalColindsSym = global_col_inds_array(Kokkos::ViewAllocateWithoutInitializing(
"global colinds sym"), addHandle->get_c_nnz());
// Numeric phase, indices only: the unsorted-input functor receives all three
// row-offset arrays, all three index arrays, and the handle's a_pos/b_pos
// arrays; it is run once per row.
300 UnsortedNumericIndicesOnlyFunctor<
301 size_t, GlobalOrdinal,
302 typename row_ptrs_array::const_type,
typename row_ptrs_array::const_type, row_ptrs_array,
303 typename global_col_inds_array::const_type,
typename global_col_inds_array::const_type, global_col_inds_array>
304 unsortedNumeric(rowptrs, rowptrsT, rowptrsSym,
305 colindsConverted, colindsTConverted, globalColindsSym,
306 addHandle->get_a_pos(), addHandle->get_b_pos());
307 Kokkos::parallel_for(
"KokkosSparse::SpAdd:Numeric::InputNotSorted",
308 range_type(0, nrows), unsortedNumeric);
// NOTE(review): the name of the function called with this argument list is
// on a line elided from the excerpt. col_map_sym is dereferenced right
// after, so the call presumably sets it -- confirm.
312 (col_map_sym, domain_map, globalColindsSym);
// Convert the combined indices back to local indices with respect to
// col_map_sym. colindsSym is allocated with a label only here (no
// ViewAllocateWithoutInitializing), unlike the other views in this section.
315 auto lclColmapSym = col_map_sym->getLocalMap();
316 colindsSym = col_inds_array(
"colindsSym", globalColindsSym.extent(0));
317 ConvertGlobalToLocalFunctor<LocalOrdinal, GlobalOrdinal, col_inds_array, global_col_inds_array, typename map_type::local_map_type> convertSym(colindsSym, globalColindsSym, lclColmapSym);
// This launch is the only parallel_for in this section without a label.
318 Kokkos::parallel_for(range_type(0, globalColindsSym.extent(0)), convertSym);
// NOTE(review): the lines separating this section from the previous one
// (presumably the 'else' of the matchingColMaps test, and the declaration of
// 'handle') are elided from this excerpt. In this section the local column
// indices of both graphs are passed to spadd directly, with no conversion.
// The spadd handle receives 'sorted' (true only when both graphs report
// isSorted()).
324 handle.create_spadd_handle(sorted);
325 auto addHandle = handle.get_spadd_handle();
// Symbolic phase on the local indices; the result's entry count is then read
// from the handle (get_c_nnz) to size colindsSym.
327 KokkosSparse::Experimental::spadd_symbolic
328 (&handle, rowptrs, colinds, rowptrsT, colindsT, rowptrsSym);
329 colindsSym = col_inds_array(Kokkos::ViewAllocateWithoutInitializing(
"C colinds"), addHandle->get_c_nnz());
// Numeric phase (indices only) with the sorted-input functor.
// NOTE(review): the condition choosing between this functor and the
// unsorted one below is elided; presumably it tests 'sorted' -- confirm.
332 SortedNumericIndicesOnlyFunctor<
333 size_t, LocalOrdinal,
334 typename row_ptrs_array::const_type,
typename row_ptrs_array::const_type, row_ptrs_array,
335 typename col_inds_array::const_type,
typename col_inds_array::const_type, col_inds_array>
336 sortedNumeric(rowptrs, rowptrsT, rowptrsSym,
337 colinds, colindsT, colindsSym);
338 Kokkos::parallel_for(
"KokkosSparse::SpAdd:Numeric::InputSorted",
339 range_type(0, nrows), sortedNumeric);
// Unsorted-input variant: same arguments plus the handle's a_pos/b_pos
// arrays.
342 UnsortedNumericIndicesOnlyFunctor<
343 size_t, LocalOrdinal,
344 typename row_ptrs_array::const_type,
typename row_ptrs_array::const_type, row_ptrs_array,
345 typename col_inds_array::const_type,
typename col_inds_array::const_type, col_inds_array>
346 unsortedNumeric(rowptrs, rowptrsT, rowptrsSym,
347 colinds, colindsT, colindsSym,
348 addHandle->get_a_pos(), addHandle->get_b_pos());
349 Kokkos::parallel_for(
"KokkosSparse::SpAdd:Numeric::InputNotSorted",
350 range_type(0, nrows), unsortedNumeric);
// Reuse the original graph's column map and importer for the result.
354 col_map_sym = col_map;
355 importer = graph->getImporter();
// sort_crs_graph is applied to the combined row offsets / column indices.
// NOTE(review): any guard around this call is not visible in the excerpt.
360 KokkosSparse::sort_crs_graph<execution_space, row_ptrs_array, col_inds_array>(rowptrsSym, colindsSym);
// Parameter list for the new graph: starts null, then a list with
// "sorted" = false is created.
// NOTE(review): the lines between (likely a condition deciding whether the
// list is created at all) are elided; as shown, "sorted" is set to false
// even though sort_crs_graph appears above -- confirm against the full file.
364 RCP<Teuchos::ParameterList> graphParams = Teuchos::null;
366 graphParams = rcp(
new Teuchos::ParameterList);
367 graphParams->set(
"sorted",
false);
// Returns a newly allocated crs_graph_type built from lclGraphSym. The
// definition of lclGraphSym and the remaining constructor arguments are cut
// off in this excerpt.
370 return rcp (
new crs_graph_type (lclGraphSym,
// NOTE(review): fragment of a different function whose signature is not
// visible in this excerpt (the timer label below suggests a local-transpose
// routine). Listing lines are elided throughout, including the definition of
// lclGraph, closing braces, and the #endif matching the #ifdef below.
433 using Teuchos::rcp_dynamic_cast;
434 using LO = LocalOrdinal;
435 using GO = GlobalOrdinal;
// Optional timer, compiled only when HAVE_TPETRA_MMM_TIMINGS is defined. Its
// name is "Tpetra " + label_ + ": " followed by "Transpose Local".
439#ifdef HAVE_TPETRA_MMM_TIMINGS
440 std::string prefix = std::string(
"Tpetra ") + label_ +
": ";
441 using Teuchos::TimeMonitor;
442 TimeMonitor MM (*TimeMonitor::getNewTimer (prefix +
"Transpose Local"));
// Immediately-evaluated lambda that reads the boolean "sort" option: yields
// sortDefault (true) when params is null, otherwise asks the parameter list
// for "sort" with sortDefault as the fallback value.
445 const bool sort = [&] () {
446 constexpr bool sortDefault =
true;
447 const char sortParamName[] =
"sort";
448 return params.get () ==
nullptr ? sortDefault :
449 params->get (sortParamName, sortDefault);
// View types of the local device graph: the c_* aliases are the graph's own
// row-map/entries types, the others their non_const_type counterparts.
456 using c_rowmap_t =
typename local_graph_device_type::row_map_type;
457 using c_entries_t =
typename local_graph_device_type::entries_type;
458 using rowmap_t =
typename local_graph_device_type::row_map_type::non_const_type;
459 using entries_t =
typename local_graph_device_type::entries_type::non_const_type;
// Local element count of the original column map; used as the row count of
// the transpose (numCols + 1 row offsets are allocated below).
// NOTE(review): the count is stored in a LocalOrdinal -- confirm the return
// type of getLocalNumElements() cannot exceed its range here.
460 LocalOrdinal numCols = origGraph_->
getColMap()->getLocalNumElements();
// Row offsets of the transpose, allocated with a label only.
461 rowmap_t lclGraphT_rowmap(
"Transpose rowmap", numCols + 1);
// Entries of the transpose: same length as the original graph's entries,
// allocated without initialization.
462 entries_t lclGraphT_entries(
463 Kokkos::ViewAllocateWithoutInitializing(
"Transpose entries"), lclGraph.entries.extent(0));
// Compute the transpose from the original row offsets / entries into the two
// views allocated above. One template argument line (listing line 466) is
// elided from this excerpt.
464 KokkosSparse::Impl::transpose_graph<
465 c_rowmap_t, c_entries_t,
467 rowmap_t,
typename local_graph_device_type::execution_space>(
468 lclGraph.numRows(), numCols,
469 lclGraph.row_map, lclGraph.entries,
470 lclGraphT_rowmap, lclGraphT_entries);
// sort_crs_graph call; its arguments and any guard (presumably the 'sort'
// flag read above -- confirm) are elided from this excerpt.
473 KokkosSparse::sort_crs_graph<
474 typename local_graph_device_type::execution_space,
475 rowmap_t, entries_t>(
// Communication objects swap roles: the import object is constructed from
// the original graph's exporter and the export object from its importer;
// each stays null when the corresponding original object is null.
484 const auto origExport = origGraph_->getExporter ();
485 RCP<const import_type> myImport = origExport.is_null () ?
486 Teuchos::null : rcp (
new import_type (*origExport));
487 const auto origImport = origGraph_->getImporter ();
488 RCP<const export_type> myExport = origImport.is_null () ?
489 Teuchos::null : rcp (
new export_type (*origImport));
// Parameter list for the new graph: starts null, then a list with
// "sorted" = false is created.
// NOTE(review): the line between (listing line 492, likely a condition on
// 'sort') is elided -- confirm whether the list is created unconditionally.
491 RCP<Teuchos::ParameterList> graphParams = Teuchos::null;
493 graphParams = rcp(
new Teuchos::ParameterList);
494 graphParams->set(
"sorted",
false);
// Build the returned graph from lclGraphT (defined on an elided line). The
// original graph's maps are passed in the order column map, row map, range
// map, domain map -- presumably filling the constructor's row-map,
// column-map, domain-map and range-map slots respectively, i.e. swapped for
// the transpose; confirm against the crs_graph_type constructor.
497 return rcp (
new crs_graph_type (lclGraphT,
498 origGraph_->getColMap (),
499 origGraph_->getRowMap (),
500 origGraph_->getRangeMap (),
501 origGraph_->getDomainMap (),
502 myImport, myExport, graphParams));