49 using graph_t =
typename CrsGraph::local_graph_type;
50 using matrix_t =
typename CrsMatrix::local_matrix_type;
51 using lno_view_t =
typename graph_t::row_map_type::non_const_type;
52 using lno_nnz_view_t =
typename graph_t::entries_type::non_const_type;
53 using scalar_view_t =
typename matrix_t::values_type::non_const_type;
54 using range_type = Kokkos::RangePolicy<LocalOrdinal, typename Node::execution_space>;
56 auto INVALID = Teuchos::OrdinalTraits<Xpetra::global_size_t>::invalid();
62 auto Ppattern = this->GetPattern();
81 auto lib = Ppattern->getRowMap()->lib();
85 auto comm = Ppattern->getRowMap()->getComm();
86 if (Dc.is_null() || Dc->getRowMap()->getComm()->getSize() < comm->getSize()) {
88 Kokkos::View<GlobalOrdinal*, typename Node::memory_space> dummy(
"", 0);
89 auto big_coarse_nodal_map = MapFactory::Build(lib, INVALID, dummy, 0, comm);
90 auto big_coarse_edge_map = MapFactory::Build(lib, INVALID, dummy, 0, comm);
91 auto big_coarse_nodal_colmap = MapFactory::Build(lib, INVALID, dummy, 0, comm);
93 typename Matrix::local_matrix_device_type dummyLocalMatrix;
94 big_Dc_ = MatrixFactory::Build(dummyLocalMatrix, big_coarse_edge_map, big_coarse_nodal_colmap, big_coarse_nodal_map, big_coarse_edge_map);
97 auto big_coarse_nodal_map = MapFactory::Build(lib, INVALID, Dc->getDomainMap()->getMyGlobalIndicesDevice(), 0, comm);
98 auto big_coarse_edge_map = MapFactory::Build(lib, INVALID, Dc->getRangeMap()->getMyGlobalIndicesDevice(), 0, comm);
99 auto big_coarse_nodal_colmap = MapFactory::Build(lib, INVALID, Dc->getColMap()->getMyGlobalIndicesDevice(), 0, comm);
101 big_Dc_ = MatrixFactory::Build(Dc->getLocalMatrixDevice(), big_coarse_edge_map, big_coarse_nodal_colmap, big_coarse_nodal_map, big_coarse_edge_map);
107 TEUCHOS_TEST_FOR_EXCEPTION(!D->getRangeMap()->isSameAs(*Ppattern->getRangeMap()),
109 "Maps are incompatible");
110 TEUCHOS_TEST_FOR_EXCEPTION(!big_Dc_->getRangeMap()->isSameAs(*Ppattern->getDomainMap()),
112 "Maps are incompatible");
115 RCP<const CrsGraph> auxGraph;
117 const auto one = Teuchos::ScalarTraits<Scalar>::one();
118 auto absP = MatrixFactory::Build(Ppattern);
119 absP->setAllToScalar(one);
120 absP->fillComplete();
122 auto absDc = MatrixFactory::BuildCopy(big_Dc_);
123 absDc->setAllToScalar(one);
125 auto P_Dc = MatrixMatrix::Multiply(*absP,
false, *absDc,
false, this->GetOStream(
Statistics2),
true,
true);
126 auxGraph = P_Dc->getCrsGraph();
128 RHS_pattern_ = auxGraph;
130 GlobalOrdinal indexBase = Ppattern->getRowMap()->getIndexBase();
131 const size_t numUnknowns = Ppattern->getLocalNumEntries();
132 const size_t numRows = Ppattern->getLocalNumRows();
133 Xpetra::global_size_t global_numConstraints = auxGraph->getGlobalNumEntries();
134 Xpetra::global_size_t global_numUnknowns = Ppattern->getGlobalNumEntries();
135 const size_t numConstraints = auxGraph->getLocalNumEntries();
136 auto constraint_rowmap = MapFactory::Build(lib, global_numConstraints, numConstraints, indexBase, comm);
137 auto constraint_domainmap = MapFactory::Build(lib, global_numUnknowns, numUnknowns, indexBase, comm);
139 RCP<Matrix> ghostedDc;
140 if (!Ppattern->getImporter().is_null())
141 ghostedDc = MatrixFactory::Build(big_Dc_, *Ppattern->getImporter());
147 auto lclPattern = Ppattern->getLocalGraphDevice();
148 auto lclD0 = ghostedDc->getLocalMatrixDevice();
149 auto lclAuxGraph = auxGraph->getLocalGraphDevice();
152 lno_view_t rowptr(
"constraint_rowptr", numConstraints + 2);
154 Kokkos::parallel_for(
155 "MueLu::SparseConstraint::sparse_constraint_num_entries_per_row",
156 range_type(0, numRows),
157 KOKKOS_LAMBDA(
const size_t pattern_i) {
158 for (
size_t pattern_jj = lclPattern.row_map(pattern_i); pattern_jj < lclPattern.row_map(pattern_i + 1); ++pattern_jj) {
159 auto pattern_j = lclPattern.entries(pattern_jj);
162 for (
size_t D0_jj = lclD0.graph.row_map(pattern_j); D0_jj < lclD0.graph.row_map(pattern_j + 1); ++D0_jj) {
163 auto D0_j = lclD0.graph.entries(D0_jj);
168 for (constraint_I = lclAuxGraph.row_map(pattern_i); constraint_I < lclAuxGraph.row_map(pattern_i + 1); ++constraint_I) {
169 if (lclAuxGraph.entries(constraint_I) == D0_j)
172#ifdef HAVE_MUELU_DEBUG
173 if (lclAuxGraph.entries(constraint_I) != D0_j)
174 ::Kokkos::abort(
"Did not find entry in row of tempGraph.");
179 Kokkos::atomic_add(&rowptr(constraint_I + 2), 1);
186 Kokkos::parallel_scan(
187 "MueLu::SparseConstraint::sparse_constraint_prefix_sum",
188 range_type(1, numConstraints + 2),
189 KOKKOS_LAMBDA(
const size_t constraint_i,
size_t& partial_nnz,
bool is_final) {
190 partial_nnz += rowptr(constraint_i);
192 rowptr(constraint_i) = partial_nnz;
197 lno_nnz_view_t colind(Kokkos::ViewAllocateWithoutInitializing(
"constraint_indices"), nnz);
198 scalar_view_t values(Kokkos::ViewAllocateWithoutInitializing(
"constraint_values"), nnz);
201 Kokkos::parallel_for(
202 "MueLu::SparseConstraint::sparse_constraint_fill",
203 range_type(0, numRows),
204 KOKKOS_LAMBDA(
const size_t pattern_i) {
205 for (
size_t pattern_jj = lclPattern.row_map(pattern_i); pattern_jj < lclPattern.row_map(pattern_i + 1); ++pattern_jj) {
206 auto pattern_j = lclPattern.entries(pattern_jj);
209 for (
size_t D0_jj = lclD0.graph.row_map(pattern_j); D0_jj < lclD0.graph.row_map(pattern_j + 1); ++D0_jj) {
210 auto D0_j = lclD0.graph.entries(D0_jj);
211 auto D0_val = lclD0.values(D0_jj);
216 for (constraint_I = lclAuxGraph.row_map(pattern_i); constraint_I < lclAuxGraph.row_map(pattern_i + 1); ++constraint_I) {
217 if (lclAuxGraph.entries(constraint_I) == D0_j)
220#ifdef HAVE_MUELU_DEBUG
221 if (lclAuxGraph.entries(constraint_I) != D0_j)
222 ::Kokkos::abort(
"Did not find entry in row of tempGraph.");
228 auto constraint_jj = Kokkos::atomic_fetch_inc(&rowptr(constraint_I + 1));
229 colind(constraint_jj) = pattern_jj;
230 values(constraint_jj) = D0_val;
235 auto lclConstraintGraph = graph_t(colind, Kokkos::subview(rowptr, Kokkos::make_pair(
size_t(0), numConstraints + 1)));
236 auto lclConstraint = matrix_t(
"constraint", numUnknowns, values, lclConstraintGraph);
237 X = MatrixFactory::Build(lclConstraint, constraint_rowmap, constraint_domainmap, constraint_domainmap, constraint_rowmap);
239 this->SetConstraintsMatrix(X);
244 using execution_space =
typename Node::execution_space;
245 using range_type = Kokkos::RangePolicy<LocalOrdinal, execution_space>;
247 auto lclGraph = RHS_pattern_->getLocalGraphDevice();
250 Kokkos::parallel_reduce(
251 "MueLu::SparseConstraint::FindBlocks::CountEmptyRows", range_type(0, lclGraph.numRows()), KOKKOS_LAMBDA(
const LocalOrdinal rowId,
LocalOrdinal& emptyRows) {
252 if (lclGraph.row_map(rowId + 1) == lclGraph.row_map(rowId))
257 auto numConstraints = lclGraph.entries.extent(0);
258 using graph_type =
typename CrsGraph::local_graph_type;
259 typename graph_type::row_map_type::non_const_type rowptr(
"blocks_rowptr", lclGraph.numRows() + 1 - numEmptyRows);
260 typename graph_type::entries_type::non_const_type indices(
"blocks_indices", numConstraints);
262 Kokkos::parallel_scan(
263 "MueLu::SparseConstraint::FindBlocks::GenerateBlockRowPtr", range_type(0, lclGraph.numRows()), KOKKOS_LAMBDA(
const LocalOrdinal rowId,
LocalOrdinal& rowIdNew,
const bool is_final) {
264 if (lclGraph.row_map(rowId + 1) != lclGraph.row_map(rowId)) {
266 rowptr(rowIdNew + 1) = lclGraph.row_map(rowId + 1);
271 Kokkos::parallel_for(
272 "MueLu::SparseConstraint::FindBlocks::FillBlockIndices", range_type(0, numConstraints), KOKKOS_LAMBDA(
const LocalOrdinal constraintId) {
273 indices(constraintId) = constraintId;
276 return graph_type(indices, rowptr);