// Walk every local entry of the input matrix's column map and fetch its
// global id (the rest of the loop body is not visible in this excerpt).
61 for (
size_t i = 0; i < input.
getColMap()->getLocalNumElements(); i++) {
62 GlobalOrdinal gcid = input.
getColMap()->getGlobalElement(i);
// Exchange per-rank counts: both vectors have one zero-initialised slot per
// rank, and this rank writes only its own slot (the size of
// ovlUnknownStatusGids).
70 std::vector<int> myUnknownDofGIDs(comm->getSize(), 0);
71 std::vector<int> numUnknownDofGIDs(comm->getSize(), 0);
72 myUnknownDofGIDs[comm->getRank()] = ovlUnknownStatusGids.
size();
// Element-wise max over all ranks. Every slot is 0 except on its owning rank
// and sizes are non-negative, so slot p ends up holding rank p's count.
73 Teuchos::reduceAll(*comm, Teuchos::REDUCE_MAX, comm->getSize(), &myUnknownDofGIDs[0], &numUnknownDofGIDs[0]);
// Total number of entries contributed by all ranks (duplicates included).
76 size_t cntUnknownDofGIDs = 0;
77 for (
int p = 0; p < comm->getRank(); p++) cntUnknownDofGIDs += numUnknownDofGIDs[p];
// Send and receive buffers sized for the global total, pre-filled with -1.
78 std::vector<GlobalOrdinal> lUnknownDofGIDs(cntUnknownDofGIDs, -1);
79 std::vector<GlobalOrdinal> gUnknownDofGIDs(cntUnknownDofGIDs, -1);
// This rank's slice starts after the entries of all lower-numbered ranks.
81 size_t cntUnknownOffset = 0;
82 for (
int p = 0; p < comm->getRank(); p++) cntUnknownOffset += numUnknownDofGIDs[p];
// Copy the local GIDs into this rank's slice of the send buffer.
83 for (
size_t k = 0; k < Teuchos::as<size_t>(ovlUnknownStatusGids.
size()); k++) {
84 lUnknownDofGIDs[k + cntUnknownOffset] = ovlUnknownStatusGids[k];
// Merge the slices with an element-wise max. The guard uses the global total,
// which is identical on all ranks, so the collective is entered consistently.
// NOTE(review): slots owned by other ranks hold -1 locally, so this relies on
// every real GID comparing greater than -1 -- confirm for the GlobalOrdinal in use.
// NOTE(review): the total is narrowed to int via Teuchos::as<int> for the count.
86 if (cntUnknownDofGIDs > 0)
87 Teuchos::reduceAll(*comm, Teuchos::REDUCE_MAX, Teuchos::as<int>(cntUnknownDofGIDs), &lUnknownDofGIDs[0], &gUnknownDofGIDs[0]);
// Sort the merged list and drop duplicate GIDs.
88 std::sort(gUnknownDofGIDs.begin(), gUnknownDofGIDs.end());
89 gUnknownDofGIDs.erase(std::unique(gUnknownDofGIDs.begin(), gUnknownDofGIDs.end()), gUnknownDofGIDs.end());
// Visit each distinct GID (what is done with curgid is not visible here).
92 for (
size_t k = 0; k < gUnknownDofGIDs.size(); k++) {
93 GlobalOrdinal curgid = gUnknownDofGIDs[k];
// Exchange per-rank counts of ovlFoundStatusGids: one zero-initialised slot
// per rank, and this rank writes only its own slot.
99 std::vector<int> myFoundDofGIDs(comm->getSize(), 0);
100 std::vector<int> numFoundDofGIDs(comm->getSize(), 0);
101 myFoundDofGIDs[comm->getRank()] = ovlFoundStatusGids.
size();
// Element-wise max over all ranks; since non-owner slots are 0 and sizes are
// non-negative, slot p ends up holding rank p's count.
102 Teuchos::reduceAll(*comm, Teuchos::REDUCE_MAX, comm->getSize(), &myFoundDofGIDs[0], &numFoundDofGIDs[0]);
// Total number of entries contributed by all ranks.
105 size_t cntFoundDofGIDs = 0;
106 for (
int p = 0; p < comm->getSize(); p++) cntFoundDofGIDs += numFoundDofGIDs[p];
// Send and receive buffers sized for the global total, pre-filled with -1.
107 std::vector<GlobalOrdinal> lFoundDofGIDs(cntFoundDofGIDs, -1);
108 std::vector<GlobalOrdinal> gFoundDofGIDs(cntFoundDofGIDs, -1);
// This rank's slice starts after the entries of all lower-numbered ranks.
110 size_t cntFoundOffset = 0;
111 for (
int p = 0; p < comm->getRank(); p++) cntFoundOffset += numFoundDofGIDs[p];
// Copy the local GIDs into this rank's slice of the send buffer.
112 for (
size_t k = 0; k < Teuchos::as<size_t>(ovlFoundStatusGids.
size()); k++) {
113 lFoundDofGIDs[k + cntFoundOffset] = ovlFoundStatusGids[k];
// Merge the slices with an element-wise max; the guard uses the global total,
// which is the same on every rank.
// NOTE(review): relies on every real GID comparing greater than the -1 filler -- confirm.
// NOTE(review): no sort/unique is visible for this list, so the std::find
// below is a linear scan over a possibly duplicated list -- confirm intent.
115 if (cntFoundDofGIDs > 0)
116 Teuchos::reduceAll(*comm, Teuchos::REDUCE_MAX, Teuchos::as<int>(cntFoundDofGIDs), &lFoundDofGIDs[0], &gFoundDofGIDs[0]);
// Second pass over the local column map: each global column id is looked up
// in gFoundDofGIDs with std::find. The beginning of that condition and the
// action taken on a hit are not visible in this excerpt.
119 for (
size_t i = 0; i < input.
getColMap()->getLocalNumElements(); i++) {
120 GlobalOrdinal gcid = input.
getColMap()->getGlobalElement(i);
122 std::find(gFoundDofGIDs.begin(), gFoundDofGIDs.end(), gcid) != gFoundDofGIDs.end()) {
// Block layout of the result: one block row per map in the range extractor,
// one block column per map in the domain extractor.
137 size_t numRows = rangeMapExtractor->NumMaps();
138 size_t numCols = domainMapExtractor->NumMaps();
// Both extractors must not be in Thyra mode; otherwise
// Xpetra::Exceptions::Incompatible is raised with the message below.
140 TEUCHOS_TEST_FOR_EXCEPTION(rangeMapExtractor->getThyraMode() ==
true,
Xpetra::Exceptions::Incompatible,
"Xpetra::MatrixUtils::Split: RangeMapExtractor must not use Thyra style numbering of GIDs. The MapExtractor must contain all GIDs of the full range map in order to define a proper splitting.")
141 TEUCHOS_TEST_FOR_EXCEPTION(domainMapExtractor->getThyraMode() ==
true,
Xpetra::Exceptions::Incompatible,
"Xpetra::MatrixUtils::Split: DomainMapExtractor must not use Thyra style numbering of GIDs. The MapExtractor must contain all GIDs of the full domain map in order to define a proper splitting.")
// Consistency check: the largest global index of the full domain map must
// equal the largest global index of the input matrix's column map.
153 TEUCHOS_TEST_FOR_EXCEPTION(fullDomainMap->getMaxAllGlobalIndex() != input.
getColMap()->getMaxAllGlobalIndex(),
Xpetra::Exceptions::Incompatible,
"Xpetra::MatrixUtils::Split: DomainMapExtractor incompatible to domain map of input matrix. fullDomainMap->getMaxAllGlobalIndex() = " << fullDomainMap->getMaxAllGlobalIndex() <<
" vs. input.getColMap()->getMaxAllGlobalIndex() = " << input.
getColMap()->getMaxAllGlobalIndex())
// No column map extractor supplied by the caller: one column map per block
// column is collected in ovlxmaps (how colMap is built is not visible here).
160 if (columnMapExtractor == Teuchos::null) {
163 std::vector<Teuchos::RCP<const Map>> ovlxmaps(numCols, Teuchos::null);
164 for (
size_t c = 0; c < numCols; c++) {
167 ovlxmaps[c] = colMap;
// Presumably the else-branch: reuse the caller-supplied extractor as is.
173 myColumnMapExtractor = columnMapExtractor;
// Thyra mode only: assemble per-block maps for the range, domain and column
// extractors. For each block, a non-null strided source map selects the
// strided shrunken map; the plain shrunken map assignment that follows is
// presumably the else-branch (the branch structure is not visible here).
180 if (bThyraMode ==
true) {
// Range side: one map per block row.
182 std::vector<Teuchos::RCP<const Map>> thyRgMapExtractorMaps(numRows, Teuchos::null);
183 for (
size_t r = 0; r < numRows; r++) {
187 if (strRangeMap != Teuchos::null) {
// Striding data, offset and strided block id are read from the source map;
// their use in constructing strShrinkedMap is not visible in this excerpt.
188 std::vector<size_t> strInfo = strRangeMap->getStridingData();
189 GlobalOrdinal offset = strRangeMap->getOffset();
190 LocalOrdinal stridedBlockId = strRangeMap->getStridedBlockId();
192 thyRgMapExtractorMaps[r] = strShrinkedMap;
194 thyRgMapExtractorMaps[r] = shrinkedMap;
// Domain and column side: one map per block column for each of the two.
200 std::vector<Teuchos::RCP<const Map>> thyDoMapExtractorMaps(numCols, Teuchos::null);
201 std::vector<Teuchos::RCP<const Map>> thyColMapExtractorMaps(numCols, Teuchos::null);
202 for (
size_t c = 0; c < numCols; c++) {
// Domain map of block column c.
207 if (strDomainMap != Teuchos::null) {
208 std::vector<size_t> strInfo = strDomainMap->getStridingData();
209 GlobalOrdinal offset = strDomainMap->getOffset();
210 LocalOrdinal stridedBlockId = strDomainMap->getStridedBlockId();
212 thyDoMapExtractorMaps[c] = strShrinkedDomainMap;
214 thyDoMapExtractorMaps[c] = shrinkedDomainMap;
// Column map of block column c.
219 if (strColMap != Teuchos::null) {
220 std::vector<size_t> strInfo = strColMap->getStridingData();
221 GlobalOrdinal offset = strColMap->getOffset();
222 LocalOrdinal stridedBlockId = strColMap->getStridedBlockId();
224 thyColMapExtractorMaps[c] = strShrinkedColMap;
226 thyColMapExtractorMaps[c] = shrinkedColMap;
// Flat row-major storage for the blocks: block (r, c) is kept at index
// r * numCols + c. The creation of each block inside the loops below is not
// visible in this excerpt.
238 std::vector<Teuchos::RCP<Matrix>> subMatrices(numRows * numCols, Teuchos::null);
239 for (
size_t r = 0; r < numRows; r++) {
240 for (
size_t c = 0; c < numCols; c++) {
244 if (bThyraMode ==
true)
// NOTE(review): doCheck / coCheck are filled with constant values here; the
// statements that create and later consume them are not visible -- confirm
// the meaning of the 1.0 and -1.0 values against the full source.
264 doCheck->putScalar(1.0);
270 doCheck->putScalar(-1.0);
271 coCheck->putScalar(-1.0);
// For every local entry of the input's domain map, store the index of the
// domain block containing its GID, converted to Scalar, in doCheckData.
274 for (
size_t rrr = 0; rrr < input.
getDomainMap()->getLocalNumElements(); rrr++) {
276 GlobalOrdinal
id = input.
getDomainMap()->getGlobalElement(rrr);
279 size_t BlockId = domainMapExtractor->getMapIndexForGID(
id);
281 doCheckData[rrr] = Teuchos::as<Scalar>(BlockId);
// Distribute the local rows of the input: the global row id determines the
// block row that receives the row's entries.
289 for (
size_t rr = 0; rr < input.
getRowMap()->getLocalNumElements(); rr++) {
291 GlobalOrdinal growid = input.
getRowMap()->getGlobalElement(rr);
300 size_t rowBlockId = rangeMapExtractor->getMapIndexForGID(growid);
// Row id used inside the block. In Thyra mode it is translated: local index
// of growid in the block's range map, then the global id at that local index
// in the corresponding map of thyRangeMapExtractor.
// NOTE(review): the meaning of the second getMap argument (true) is not
// visible here -- presumably selects Thyra-style numbering; confirm.
303 GlobalOrdinal subblock_growid = growid;
304 if (bThyraMode ==
true) {
306 LocalOrdinal lrowid = rangeMapExtractor->getMap(rowBlockId)->getLocalElement(growid);
308 subblock_growid = thyRangeMapExtractor->getMap(rowBlockId,
true)->getGlobalElement(lrowid);
// Sort the entries of the current row into per-column-block buckets. indices
// holds local column indices (they are mapped to global ids through the
// input's column map); vals holds the matching values.
321 for (
size_t i = 0; i < (size_t)indices.
size(); i++) {
323 GlobalOrdinal gcolid = input.
getColMap()->getGlobalElement(indices[i]);
325 size_t colBlockId = myColumnMapExtractor->getMapIndexForGID(gcolid);
// Same translation as for rows, applied to the column id in Thyra mode.
329 GlobalOrdinal subblock_gcolid = gcolid;
330 if (bThyraMode ==
true) {
332 LocalOrdinal lcolid = myColumnMapExtractor->getMap(colBlockId)->getLocalElement(gcolid);
334 subblock_gcolid = thyColMapExtractor->getMap(colBlockId,
true)->getGlobalElement(lcolid);
336 blockColIdx[colBlockId].push_back(subblock_gcolid);
337 blockColVals[colBlockId].push_back(vals[i]);
// Insert the bucket of every column block c into block (rowBlockId, c) under
// the (possibly translated) row id.
340 for (
size_t c = 0; c < numCols; c++) {
341 subMatrices[rowBlockId * numCols + c]->insertGlobalValues(subblock_growid, blockColIdx[c].view(0, blockColIdx[c].size()), blockColVals[c].view(0, blockColVals[c].size()));
// Finalise all blocks. In Thyra mode the domain/range maps come from the
// Thyra extractors; the second pair of loops (presumably the else-branch)
// uses the maps of the original extractors.
347 if (bThyraMode ==
true) {
348 for (
size_t r = 0; r < numRows; r++) {
349 for (
size_t c = 0; c < numCols; c++) {
350 subMatrices[r * numCols + c]->fillComplete(thyDomainMapExtractor->getMap(c,
true), thyRangeMapExtractor->getMap(r,
true));
355 for (
size_t r = 0; r < numRows; r++) {
356 for (
size_t c = 0; c < numCols; c++) {
357 subMatrices[r * numCols + c]->fillComplete(domainMapExtractor->getMap(c), rangeMapExtractor->getMap(r));
// Hand every completed block over to bA at its (r, c) position.
363 for (
size_t r = 0; r < numRows; r++) {
364 for (
size_t c = 0; c < numCols; c++) {
365 bA->setMatrix(r, c, subMatrices[r * numCols + c]);
375 const Scalar replacementValue) {
377 using Teuchos::rcp_dynamic_cast;
// gZeroDiags receives the global number of too-small diagonal entries from a
// reduceAll on whichever path runs. usedEfficientPath records whether the
// Tpetra/Kokkos path below handled the matrix; if not, the generic path runs.
379 GlobalOrdinal gZeroDiags;
380 bool usedEfficientPath =
false;
// Try to view the wrapped CRS matrix of Ac as the Tpetra-backed implementation.
385 tpCrsAc = rcp_dynamic_cast<TpetraCrsMatrix>(crsWrapAc->getCrsMatrix());
// Ask the Tpetra graph for the position of the diagonal entry in each local
// row. The view is allocated without initialisation because
// getLocalDiagOffsets is called on it immediately afterwards.
388 auto tpCrsGraph = tpCrsAc->getTpetra_CrsMatrix()->getCrsGraph();
389 size_t numRows = Ac->getRowMap()->getLocalNumElements();
391 using range_type = Kokkos::RangePolicy<LocalOrdinal, typename Node::execution_space>;
392 auto offsets = offset_type(Kokkos::ViewAllocateWithoutInitializing(
"offsets"), numRows);
393 tpCrsGraph->getLocalDiagOffsets(offsets);
// Presumably the initialiser of STINV (the start of this statement is not
// visible): the "invalid" marker of the offset value type, compared against
// offsets(i) below to detect rows without a stored diagonal entry.
396 Tpetra::Details::OrdinalTraits<typename offset_type::value_type>::invalid();
// Repair requested: first count the local rows whose diagonal offset equals
// STINV, i.e. rows with no stored diagonal entry.
398 if (repairZeroDiagonals) {
402 LO numMissingDiagonalEntries = 0;
404 Kokkos::parallel_reduce(
405 "countMissingDiagonalEntries",
406 range_type(0, numRows),
407 KOKKOS_LAMBDA(
const LO i,
LO& missing) {
408 missing += (offsets(i) == STINV);
410 numMissingDiagonalEntries);
// Sum the missing-entry counts over all ranks of the row map's communicator.
412 GlobalOrdinal gNumMissingDiagonalEntries;
413 Teuchos::reduceAll(*(Ac->getRowMap()->getComm()), Teuchos::REDUCE_SUM, Teuchos::as<GlobalOrdinal>(numMissingDiagonalEntries),
414 Teuchos::outArg(gNumMissingDiagonalEntries));
// In-place repair is only taken when no rank is missing a diagonal entry, so
// offsets(i) can be used directly as an index into each row below.
416 if (gNumMissingDiagonalEntries == 0) {
419 auto lclA = tpCrsAc->getTpetra_CrsMatrix()->getLocalMatrixDevice();
421 using ATS = KokkosKernels::ArithTraits<Scalar>;
422 using impl_ATS = KokkosKernels::ArithTraits<typename ATS::val_type>;
// Convert the replacement value to the device-side value type once, outside
// the kernel.
425 typename ATS::val_type impl_replacementValue = replacementValue;
// Overwrite every diagonal entry whose magnitude is <= threshold with the
// replacement value (the counting of fixed entries is on lines not visible here).
427 Kokkos::parallel_reduce(
428 "fixSmallDiagonalEntries",
429 range_type(0, numRows),
430 KOKKOS_LAMBDA(
const LO i,
LO& fixed) {
431 const auto offset = offsets(i);
432 auto curRow = lclA.row(i);
433 if (impl_ATS::magnitude(curRow.value(offset)) <= threshold) {
434 curRow.value(offset) = impl_replacementValue;
// Global number of repaired entries; the generic path is then skipped.
440 Teuchos::reduceAll(*(Ac->getRowMap()->getComm()), Teuchos::REDUCE_SUM, Teuchos::as<GlobalOrdinal>(lZeroDiags),
441 Teuchos::outArg(gZeroDiags));
443 usedEfficientPath =
true;
// Detection-only variant (presumably the branch taken when no repair is
// requested): examine the diagonal entries without modifying the matrix.
449 auto lclA = tpCrsAc->getTpetra_CrsMatrix()->getLocalMatrixDevice();
451 using ATS = KokkosKernels::ArithTraits<Scalar>;
452 using impl_ATS = KokkosKernels::ArithTraits<typename ATS::val_type>;
// NOTE(review): lines between reading the offset and accessing the row are
// not visible; presumably they handle offset == STINV before curRow.value(offset)
// is evaluated -- confirm against the full source.
456 Kokkos::parallel_reduce(
457 "detectSmallDiagonalEntries",
458 range_type(0, numRows),
459 KOKKOS_LAMBDA(
const LO i,
LO& small) {
460 const auto offset = offsets(i);
464 auto curRow = lclA.row(i);
465 if (impl_ATS::magnitude(curRow.value(offset)) <= threshold) {
// Global number of detected entries; the generic path is then skipped.
472 Teuchos::reduceAll(*(Ac->getRowMap()->getComm()), Teuchos::REDUCE_SUM, Teuchos::as<GlobalOrdinal>(lZeroDiags),
473 Teuchos::outArg(gZeroDiags));
475 usedEfficientPath =
true;
// Generic path, used whenever the Tpetra/Kokkos path above did not run.
479 if (!usedEfficientPath) {
// Extract a copy of the local diagonal of Ac.
482 Ac->getLocalDiagCopy(*diagVec);
// Scan the local diagonal for entries with magnitude <= threshold (the
// increment of lZeroDiags is on a line not visible here).
484 LocalOrdinal lZeroDiags = 0;
487 for (
size_t i = 0; i < rowMap->getLocalNumElements(); i++) {
488 if (TST::magnitude(diagVal[i]) <= threshold) {
// Sum the local counts over all ranks of the row map's communicator.
493 Teuchos::reduceAll(*(rowMap->getComm()), Teuchos::REDUCE_SUM, Teuchos::as<GlobalOrdinal>(lZeroDiags),
494 Teuchos::outArg(gZeroDiags));
// Repair only if requested and at least one rank found a too-small entry.
496 if (repairZeroDiagonals && gZeroDiags > 0) {
// Build a correction matrix with one entry (value replacementValue) in each
// affected row. indout is presumably set to the row's own global id on a
// line not visible here, which would place the entry on the diagonal -- confirm.
514 for (
size_t r = 0; r < rowMap->getLocalNumElements(); r++) {
515 if (TST::magnitude(diagVal[r]) <= threshold) {
516 GlobalOrdinal grid = rowMap->getGlobalElement(r);
518 valout[0] = replacementValue;
519 fixDiagMatrix->insertGlobalValues(grid, indout(), valout());
524 fixDiagMatrix->fillComplete(Ac->getDomainMap(), Ac->getRangeMap());
// newAc = 1.0 * Ac + 1.0 * fixDiagMatrix, neither operand transposed.
// NOTE(review): this adds replacementValue to whatever small value is already
// stored on the diagonal, whereas the in-place Kokkos path overwrites the
// entry with replacementValue. The results differ for small non-zero
// entries -- confirm that this is intended.
528 Xpetra::MatrixMatrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>::TwoMatrixAdd(*Ac,
false, 1.0, *fixDiagMatrix,
false, 1.0, newAc, fos);
// Carry the "stridedMaps" view over to the new matrix when Ac has one.
529 if (Ac->IsView(
"stridedMaps"))
530 newAc->CreateView(
"stridedMaps", Ac);
// Drop the reference to the temporary correction matrix.
533 fixDiagMatrix = Teuchos::null;
// Parameter list entry requesting storage optimisation; the call consuming p
// is not visible in this excerpt.
539 p->set(
"DoOptimizeStorage",
true);
// Report how many too-small diagonal entries were repaired or merely found.
548 fos <<
"CheckRepairMainDiagonal: " << (repairZeroDiagonals ?
"repaired " :
"found ")
549 << gZeroDiags <<
" too small entries (threshold = " << threshold <<
") on main diagonal of Ac." << std::endl;
// Debug builds only: re-read the diagonal and emit an error message for
// entries that are still at or below the threshold.
551#ifdef HAVE_XPETRA_DEBUG
557 Ac->getLocalDiagCopy(*diagVec);
558 diagVal = diagVec->getData(0);
559 for (
size_t r = 0; r < Ac->getRowMap()->getLocalNumElements(); r++) {
560 if (TST::magnitude(diagVal[r]) <= threshold) {
561 fos <<
"Error: there are too small entries left on diagonal after repair..." << std::endl;