10#ifndef TPETRA_DETAILS_CRSUTILS_HPP
11#define TPETRA_DETAILS_CRSUTILS_HPP
15#include "TpetraCore_config.h"
16#include "Kokkos_Core.hpp"
18#include "Tpetra_Details_CrsPadding.hpp"
19#include "Tpetra_Details_WrappedDualView.hpp"
22#include <unordered_map>
36template <
class ViewType>
38make_uninitialized_view(
39 const std::string& name,
42 const std::string*
const prefix) {
44 std::ostringstream os;
45 os << *prefix <<
"Allocate Kokkos::View " << name
46 <<
": " << size << std::endl;
47 std::cerr << os.str();
49 using Kokkos::view_alloc;
50 using Kokkos::WithoutInitializing;
51 return ViewType(view_alloc(name, WithoutInitializing), size);
54template <
class ViewType>
57 const std::string& name,
60 const std::string*
const prefix) {
62 std::ostringstream os;
63 os << *prefix <<
"Allocate & initialize Kokkos::View "
64 << name <<
": " << size << std::endl;
65 std::cerr << os.str();
67 return ViewType(name, size);
70template <
class OutViewType,
class InViewType>
71void assign_to_view(OutViewType& out,
73 const char viewName[],
75 const std::string*
const prefix) {
77 std::ostringstream os;
78 os << *prefix <<
"Assign to Kokkos::View " << viewName
79 <<
": Old size: " << out.extent(0)
80 <<
", New size: " << in.extent(0) << std::endl;
81 std::cerr << os.str();
86template <
class MemorySpace,
class ViewType>
87auto create_mirror_view(
88 const MemorySpace& memSpace,
91 const std::string*
const prefix) ->
decltype(Kokkos::create_mirror_view(memSpace, view)) {
93 std::ostringstream os;
94 os << *prefix <<
"Create mirror view: "
95 <<
"view.extent(0): " << view.extent(0) << std::endl;
96 std::cerr << os.str();
98 return Kokkos::create_mirror_view(memSpace, view);
101enum class PadCrsAction {
119template <
class RowPtr,
class Indices,
class Values,
class Padding>
121 const PadCrsAction
action,
128 const bool verbose) {
129 using execution_space =
typename Indices::t_dev::execution_space;
130 using Kokkos::view_alloc;
131 using Kokkos::WithoutInitializing;
133 std::unique_ptr<std::string>
prefix;
137 std::ostringstream
os;
138 os <<
"Proc " <<
my_rank <<
": Tpetra::...::pad_crs_arrays: ";
139 prefix = std::unique_ptr<std::string>(
new std::string(
os.str()));
141 std::cerr <<
os.str();
146 std::ostringstream
os;
162 <<
", values.extent(0): " <<
values_wdv.extent(0)
166 std::cerr <<
os.str();
171 std::ostringstream
os;
172 os << *
prefix <<
"Done; local matrix has no rows" <<
endl;
173 std::cerr <<
os.str();
183 std::ostringstream
os;
184 os << *
prefix <<
"Fill newAllocPerRow & compute increase" <<
endl;
185 std::cerr <<
os.str();
211 Kokkos::DefaultHostExecutionSpace,
size_t>;
212 Kokkos::parallel_reduce(
213 "Tpetra::CrsGraph: Compute new allocation size per row",
240 std::ostringstream
os;
245 std::cerr <<
os.str();
256 typename Indices::t_dev::non_const_value_type;
263 "Tpetra::CrsGraph column indices",
newIndsSize, verbose,
268 if (
action == PadCrsAction::INDICES_AND_VALUES) {
277 std::ostringstream
os;
279 std::cerr <<
os.str();
282 using range_type = Kokkos::RangePolicy<execution_space, size_t>;
283 Kokkos::parallel_scan(
284 "Tpetra::CrsGraph or CrsMatrix repack",
285 range_type(
size_t(0),
size_t(
lclNumRows + 1)),
299 const Kokkos::pair<size_t, size_t>
oldRange(
301 const Kokkos::pair<size_t, size_t>
newRange(
309 if (
action == PadCrsAction::INDICES_AND_VALUES) {
327 std::ostringstream
os;
347 std::cout <<
os.str();
357 std::ostringstream
os;
368 std::ostringstream
os;
370 std::cerr <<
os.str();
375template <
class Po
inters,
class InOutIndices,
class InIndices,
class IndexMap>
378 typename Pointers::value_type
const row,
384 std::function<
void(
size_t const,
size_t const,
size_t const)>
cb) {
391 return Teuchos::OrdinalTraits<size_t>::invalid();
394 using offset_type =
typename std::decay<
decltype(
row_ptrs[0])>::type;
397 const offset_type start =
row_ptrs[row];
422 return Teuchos::OrdinalTraits<size_t>::invalid();
449 return Teuchos::OrdinalTraits<size_t>::invalid();
470template <
class Po
inters,
class Indices1,
class Indices2,
class IndexMap,
class Callback>
473 typename Pointers::value_type
const row,
484 typename std::remove_const<typename Indices1::value_type>::type;
487 const size_t start =
static_cast<size_t>(
row_ptrs[row]);
498 std::forward<Callback>(
cb)(
k, start,
off);
507template <
class Po
inters,
class Indices1,
class Indices2,
class IndexMap,
class Callback>
509 typename Pointers::value_type
const row,
519 using ordinal =
typename std::remove_const<typename Indices1::value_type>::type;
522 const size_t start =
static_cast<size_t>(
row_ptrs[row]);
536 std::forward<Callback>(
cb)(
k, start,
off);
564template <
class RowPtr,
class Indices,
class Padding>
571 const bool verbose) {
572 using impl::pad_crs_arrays;
580template <
class RowPtr,
class Indices,
class Values,
class Padding>
588 const bool verbose) {
589 using impl::pad_crs_arrays;
639template <
class Po
inters,
class InOutIndices,
class InIndices>
642 typename Pointers::value_type
const row,
647 std::function<
void(
const size_t,
const size_t,
const size_t)>
cb =
648 std::function<
void(
const size_t,
const size_t,
const size_t)>()) {
649 static_assert(std::is_same<typename std::remove_const<typename InOutIndices::value_type>::type,
650 typename std::remove_const<typename InIndices::value_type>::type>::value,
651 "Expected views to have same value type");
654 using ordinal =
typename InOutIndices::value_type;
661template <
class Po
inters,
class InOutIndices,
class InIndices>
664 typename Pointers::value_type
const row,
669 std::function<
typename InOutIndices::value_type(
const typename InIndices::value_type)>
map,
670 std::function<
void(
const size_t,
const size_t,
const size_t)>
cb =
671 std::function<
void(
const size_t,
const size_t,
const size_t)>()) {
706template <
class Po
inters,
class Indices1,
class Indices2,
class Callback>
709 typename Pointers::value_type
const row,
715 static_assert(std::is_same<typename std::remove_const<typename Indices1::value_type>::type,
716 typename std::remove_const<typename Indices2::value_type>::type>::value,
717 "Expected views to have same value type");
719 using ordinal =
typename Indices2::value_type;
720 auto numFound = impl::find_crs_indices(
726template <
class Po
inters,
class Indices1,
class Indices2,
class IndexMap,
class Callback>
729 typename Pointers::value_type
const row,
739template <
class Po
inters,
class Indices1,
class Indices2,
class IndexMap,
class Callback>
740size_t findCrsIndicesSorted(
741 typename Pointers::value_type
const row,
742 Pointers
const& rowPtrs,
743 const size_t curNumEntries,
744 Indices1
const& curIndices,
745 Indices2
const& newIndices,
748 return impl::find_crs_indices_sorted(row, rowPtrs, curNumEntries, curIndices, newIndices, map, cb);
Declaration of Tpetra::Details::Behavior, a class that describes Tpetra's behavior.
void pad_crs_arrays(const PadCrsAction action, const RowPtr &row_ptr_beg, const RowPtr &row_ptr_end, Indices &indices_wdv, Values &values_wdv, const Padding &padding, const int my_rank, const bool verbose)
Implementation of padCrsArrays.
size_t find_crs_indices(typename Pointers::value_type const row, Pointers const &row_ptrs, const size_t curNumEntries, Indices1 const &cur_indices, Indices2 const &new_indices, IndexMap &&map, Callback &&cb)
Implementation of findCrsIndices.
size_t find_crs_indices_sorted(typename Pointers::value_type const row, Pointers const &row_ptrs, const size_t curNumEntries, Indices1 const &cur_indices, Indices2 const &new_indices, IndexMap &&map, Callback &&cb)
Implementation of findCrsIndicesSorted.
size_t insert_crs_indices(typename Pointers::value_type const row, Pointers const &row_ptrs, InOutIndices &cur_indices, size_t &num_assigned, InIndices const &new_indices, IndexMap &&map, std::function< void(size_t const, size_t const, size_t const)> cb)
Implementation of insertCrsIndices.
Struct that holds views of the contents of a CrsMatrix.
static size_t verbosePrintCountThreshold()
Number of entries below which arrays, lists, etc. will be printed in debug mode.
Implementation details of Tpetra.
void padCrsArrays(const RowPtr &rowPtrBeg, const RowPtr &rowPtrEnd, Indices &indices_wdv, const Padding &padding, const int my_rank, const bool verbose)
Determine whether the row pointers and indices arrays need to be resized to accommodate new entries...
void verbosePrintArray(std::ostream &out, const ArrayType &x, const char name[], const size_t maxNumToPrint)
Print min(x.size(), maxNumToPrint) entries of x.
size_t insertCrsIndices(typename Pointers::value_type const row, Pointers const &rowPtrs, InOutIndices &curIndices, size_t &numAssigned, InIndices const &newIndices, std::function< void(const size_t, const size_t, const size_t)> cb=std::function< void(const size_t, const size_t, const size_t)>())
Insert new indices into the current list of indices.
size_t findCrsIndices(typename Pointers::value_type const row, Pointers const &rowPtrs, const size_t curNumEntries, Indices1 const &curIndices, Indices2 const &newIndices, Callback &&cb)
Finds offsets into the current list of indices.
Namespace Tpetra contains the class and methods constituting the Tpetra library.