457 regSum(rowIdx) += local_mat_dev.values(entryIdx);
458 if (KAT_M::zero() < KAT_S::abs(local_mat_dev.values(entryIdx))) {
461 diag_dev(rowIdx, 0) += KAT_S::abs(local_mat_dev.values(entryIdx));
462 if (rowIdx == local_mat_dev.graph.entries(entryIdx)) {
463 Kokkos::atomic_add(&avgAbsDiagVal_dev(), KAT_S::abs(local_mat_dev.values(entryIdx)));
467 if (nnzPerRow(rowIdx) == 1 && KAT_S::magnitude(diag_dev(rowIdx, 0)) == KAT_M::one()) {
468 Kokkos::atomic_add(&numDiagsEqualToOne_dev(), 1);
472 if (useAverageAbsDiagVal) {
473 Teuchos::TimeMonitor MMM = *Teuchos::TimeMonitor::getNewTimer(
"GetLumpedMatrixDiagonal: useAverageAbsDiagVal");
474 typename Kokkos::View<mag_type, execution_space>::HostMirror avgAbsDiagVal = Kokkos::create_mirror_view(avgAbsDiagVal_dev);
475 Kokkos::deep_copy(avgAbsDiagVal, avgAbsDiagVal_dev);
476 int numDiagsEqualToOne;
477 Kokkos::deep_copy(numDiagsEqualToOne, numDiagsEqualToOne_dev);
479 tol = TST::magnitude(100 * Teuchos::ScalarTraits<Scalar>::eps()) * (avgAbsDiagVal() - numDiagsEqualToOne) / (rowMap->getLocalNumElements() - numDiagsEqualToOne);
483 Teuchos::TimeMonitor MMM = *Teuchos::TimeMonitor::getNewTimer(
"ComputeLumpedDiagonalInverse: parallel_for (doReciprocal)");
484 Kokkos::parallel_for(
485 "ComputeLumpedDiagonalInverse", my_policy,
486 KOKKOS_LAMBDA(
const int rowIdx) {
487 if (replaceSingleEntryRowWithZero && nnzPerRow(rowIdx) <= 1) {
488 diag_dev(rowIdx, 0) = KAT_S::zero();
489 }
else if ((diag_dev(rowIdx, 0) != KAT_S::zero()) && (KAT_S::magnitude(diag_dev(rowIdx, 0)) < KAT_S::magnitude(2 * regSum(rowIdx)))) {
490 diag_dev(rowIdx, 0) = KAT_S::one() / KAT_S::magnitude(2 * regSum(rowIdx));
492 if (KAT_S::magnitude(diag_dev(rowIdx, 0)) > tol) {
493 diag_dev(rowIdx, 0) = KAT_S::one() / diag_dev(rowIdx, 0);
495 diag_dev(rowIdx, 0) = valReplacement_dev;
502 Teuchos::TimeMonitor MMM = *Teuchos::TimeMonitor::getNewTimer(
"GetLumpedMatrixDiagonal: parallel_for");
503 Kokkos::parallel_for(
504 "GetLumpedMatrixDiagonal", my_policy,
505 KOKKOS_LAMBDA(
const int rowIdx) {
506 diag_dev(rowIdx, 0) = KAT_S::zero();
507 for (size_type entryIdx = local_mat_dev.graph.row_map(rowIdx);
508 entryIdx < local_mat_dev.graph.row_map(rowIdx + 1);
510 diag_dev(rowIdx, 0) += KAT_S::magnitude(local_mat_dev.values(entryIdx));
516 Teuchos::TimeMonitor MMM = *Teuchos::TimeMonitor::getNewTimer(
"UtilitiesBase: GetLumpedMatrixDiagonal: (Teuchos implementation)");
517 ArrayRCP<Scalar> diagVals = diag->getDataNonConst(0);
518 Teuchos::Array<Scalar> regSum(diag->getLocalLength());
519 Teuchos::ArrayView<const LocalOrdinal> cols;
520 Teuchos::ArrayView<const Scalar> vals;
522 std::vector<int> nnzPerRow(rowMap->getLocalNumElements());
527 const Magnitude zeroMagn = TST::magnitude(zero);
528 Magnitude avgAbsDiagVal = TST::magnitude(zero);
529 int numDiagsEqualToOne = 0;
530 for (
size_t i = 0; i < rowMap->getLocalNumElements(); ++i) {
532 rcpA->getLocalRowView(i, cols, vals);
535 regSum[i] += vals[j];
536 const Magnitude rowEntryMagn = TST::magnitude(vals[j]);
537 if (rowEntryMagn > zeroMagn)
539 diagVals[i] += rowEntryMagn;
540 if (
static_cast<size_t>(cols[j]) == i)
541 avgAbsDiagVal += rowEntryMagn;
543 if (nnzPerRow[i] == 1 && TST::magnitude(diagVals[i]) == 1.)
544 numDiagsEqualToOne++;
546 if (useAverageAbsDiagVal)
547 tol = TST::magnitude(100 * Teuchos::ScalarTraits<Scalar>::eps()) * (avgAbsDiagVal - numDiagsEqualToOne) / (rowMap->getLocalNumElements() - numDiagsEqualToOne);
549 for (
size_t i = 0; i < rowMap->getLocalNumElements(); ++i) {
550 if (replaceSingleEntryRowWithZero && nnzPerRow[i] <=
static_cast<int>(1))
552 else if ((diagVals[i] != zero) && (TST::magnitude(diagVals[i]) < TST::magnitude(two * regSum[i])))
553 diagVals[i] = one / TST::magnitude((two * regSum[i]));
555 if (TST::magnitude(diagVals[i]) > tol)
556 diagVals[i] = one / diagVals[i];
558 diagVals[i] = valReplacement;
565 TEUCHOS_TEST_FOR_EXCEPTION(doReciprocal, Xpetra::Exceptions::RuntimeError,
566 "UtilitiesBase::GetLumpedMatrixDiagonal(): extracting reciprocal of diagonal of a blocked matrix is not supported");
567 diag = Xpetra::VectorFactory<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Build(bA->getRangeMapExtractor()->getFullMap(),
true);
569 for (
size_t row = 0; row < bA->Rows(); ++row) {
570 for (
size_t col = 0; col < bA->Cols(); ++col) {
571 if (!bA->getMatrix(row, col).is_null()) {
573 bool bThyraMode = bA->getRangeMapExtractor()->getThyraMode() && (Teuchos::rcp_dynamic_cast<Xpetra::BlockedCrsMatrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>>(bA->getMatrix(row, col)) == Teuchos::null);
574 RCP<Vector> ddtemp = bA->getRangeMapExtractor()->ExtractVector(diag, row, bThyraMode);
575 RCP<const Vector> dd = GetLumpedMatrixDiagonal(*(bA->getMatrix(row, col)));
576 ddtemp->update(Teuchos::as<Scalar>(1.0), *dd, Teuchos::as<Scalar>(1.0));
577 bA->getRangeMapExtractor()->InsertVector(ddtemp, row, diag, bThyraMode);
// For every local row of A, stores the largest value of -real(a_ij) taken over
// the entries whose local column index differs from the local row index.
// The running maximum starts at KAT_S::zero(), so the stored value is never
// negative in its real part.
// NOTE(review): the signature line and the lambda header are not shown here;
// the kernel label suggests this is GetMatrixMaxMinusOffDiagonal(A) — confirm.
586template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
587Teuchos::RCP<Xpetra::Vector<Scalar, LocalOrdinal, GlobalOrdinal, Node>>
591 RCP<const Map> rowMap = A.getRowMap();
// Result vector lives on A's row map. The `false` flag presumably skips
// zero-initialisation (TODO confirm); every entry is written by the kernel.
592 auto diag = Xpetra::VectorFactory<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Build(rowMap,
false);
// Type aliases derived from the vector's device view and the local matrix.
595 using local_vector_type =
typename Vector::dual_view_type::t_dev_um;
596 using local_matrix_type =
typename Matrix::local_matrix_type;
597 using execution_space =
typename local_vector_type::execution_space;
598 using values_type =
typename local_matrix_type::values_type;
599 using scalar_type =
typename values_type::non_const_value_type;
600 using KAT_S =
typename Kokkos::ArithTraits<scalar_type>;
// The view is requested with OverwriteAll: previous contents are not read.
602 auto diag_dev = diag->getDeviceLocalView(Xpetra::Access::OverwriteAll);
603 auto local_mat_dev = A.getLocalMatrixDevice();
// One work item per local entry of the result vector, indexed with int.
604 Kokkos::RangePolicy<execution_space, int> my_policy(0,
static_cast<int>(diag_dev.extent(0)));
606 Kokkos::parallel_for(
607 "GetMatrixMaxMinusOffDiagonal", my_policy,
// Per-row scan: keep the maximum of -real(value) over off-diagonal entries.
609 auto mymax = KAT_S::zero();
610 auto row = local_mat_dev.rowConst(rowIdx);
611 for (
LocalOrdinal entryIdx = 0; entryIdx < row.length; ++entryIdx) {
// Diagonal test compares the local row index with the local column index.
612 if (rowIdx != row.colidx(entryIdx)) {
613 if (KAT_S::real(mymax) < -KAT_S::real(row.value(entryIdx)))
614 mymax = -KAT_S::real(row.value(entryIdx));
617 diag_dev(rowIdx, 0) = mymax;
// Block-aware variant: for every local row of A, stores the largest value of
// -real(a_ij) over off-diagonal entries whose column carries the same block
// number as the row. The running maximum starts at KAT_S::zero().
//
// A           - matrix whose rows are scanned.
// BlockNumber - vector of block ids; its map must be the same as A's column
//               map, otherwise std::runtime_error is thrown.
623template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
624Teuchos::RCP<Xpetra::Vector<Scalar, LocalOrdinal, GlobalOrdinal, Node>>
626 GetMatrixMaxMinusOffDiagonal(
const Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>& A,
const Xpetra::Vector<LocalOrdinal, LocalOrdinal, GlobalOrdinal, Node>& BlockNumber) {
// NOTE(review): the message text reads "must match's A's" — likely a typo.
627 TEUCHOS_TEST_FOR_EXCEPTION(!A.getColMap()->isSameAs(*BlockNumber.getMap()), std::runtime_error,
"GetMatrixMaxMinusOffDiagonal: BlockNumber must match's A's column map.");
630 RCP<const Map> rowMap = A.getRowMap();
// Result vector on the row map. The `false` flag presumably skips
// zero-initialisation (TODO confirm); the kernel writes every entry.
631 auto diag = Xpetra::VectorFactory<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Build(rowMap,
false);
// Type aliases derived from the vector's device view and the local matrix.
634 using local_vector_type =
typename Vector::dual_view_type::t_dev_um;
635 using local_matrix_type =
typename Matrix::local_matrix_type;
636 using execution_space =
typename local_vector_type::execution_space;
637 using values_type =
typename local_matrix_type::values_type;
638 using scalar_type =
typename values_type::non_const_value_type;
639 using KAT_S =
typename Kokkos::ArithTraits<scalar_type>;
641 auto diag_dev = diag->getDeviceLocalView(Xpetra::Access::OverwriteAll);
642 auto local_mat_dev = A.getLocalMatrixDevice();
643 auto local_block_dev = BlockNumber.getDeviceLocalView(Xpetra::Access::ReadOnly);
// One work item per local entry of the result vector, indexed with int.
644 Kokkos::RangePolicy<execution_space, int> my_policy(0,
static_cast<int>(diag_dev.extent(0)));
646 Kokkos::parallel_for(
647 "GetMatrixMaxMinusOffDiagonal", my_policy,
649 auto mymax = KAT_S::zero();
650 auto row = local_mat_dev.row(rowIdx);
651 for (
LocalOrdinal entryIdx = 0; entryIdx < row.length; ++entryIdx) {
// Only off-diagonal entries in the same block as the row are considered.
// NOTE(review): local_block_dev lives on the column map but is looked up with
// the local row index; this presumably relies on owned rows having the same
// local index in the column map — confirm.
652 if ((rowIdx != row.colidx(entryIdx)) && (local_block_dev(rowIdx, 0) == local_block_dev(row.colidx(entryIdx), 0))) {
653 if (KAT_S::real(mymax) < -KAT_S::real(row.value(entryIdx)))
654 mymax = -KAT_S::real(row.value(entryIdx));
657 diag_dev(rowIdx, 0) = mymax;
// Returns a vector on v's map holding an entry-wise reciprocal of v.
//
// v              - input vector (may be a BlockedVector).
// tol            - entries whose magnitude exceeds tol are inverted.
// valReplacement - value written to the remaining entries (the `else` line is
//                  not shown here; presumably this is the fallback branch).
// Throws MueLu::Exceptions::RuntimeError when v is blocked but the freshly
// built result vector is not a BlockedVector.
663template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
664Teuchos::RCP<Xpetra::Vector<Scalar, LocalOrdinal, GlobalOrdinal, Node>>
666 GetInverse(Teuchos::RCP<
const Xpetra::Vector<Scalar, LocalOrdinal, GlobalOrdinal, Node>> v,
typename Teuchos::ScalarTraits<Scalar>::magnitudeType tol,
Scalar valReplacement) {
// Result is built on the same map as the input, with the `true` flag.
667 RCP<Vector> ret = Xpetra::VectorFactory<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Build(v->getMap(),
true);
// Blocked input: handle each sub-vector separately.
670 RCP<const BlockedVector> bv = Teuchos::rcp_dynamic_cast<const BlockedVector>(v);
671 if (bv.is_null() ==
false) {
672 RCP<BlockedVector> bret = Teuchos::rcp_dynamic_cast<BlockedVector>(ret);
673 TEUCHOS_TEST_FOR_EXCEPTION(bret.is_null() ==
true,
MueLu::Exceptions::RuntimeError,
"MueLu::UtilitiesBase::GetInverse: return vector should be of type BlockedVector");
674 RCP<const BlockedMap> bmap = bv->getBlockedMap();
675 for (
size_t r = 0; r < bmap->getNumMaps(); ++r) {
// Take column 0 of block r, using the blocked map's Thyra-mode setting.
676 RCP<const MultiVector> submvec = bv->getMultiVector(r, bmap->getThyraMode());
677 RCP<const Vector> subvec = submvec->getVector(0);
// `subvecinf` is defined on a line not shown here; presumably it is the
// inverse of `subvec` — confirm.
679 bret->setMultiVector(r, subvecinf, bmap->getThyraMode());
// Non-blocked path: invert entry by entry on the host data of column 0.
685 ArrayRCP<Scalar> retVals = ret->getDataNonConst(0);
686 ArrayRCP<const Scalar> inputVals = v->getData(0);
687 for (
size_t i = 0; i < v->getMap()->getLocalNumElements(); ++i) {
688 if (Teuchos::ScalarTraits<Scalar>::magnitude(inputVals[i]) > tol)
689 retVals[i] = Teuchos::ScalarTraits<Scalar>::one() / inputVals[i];
691 retVals[i] = valReplacement;
// Produces a vector on A's column map filled by importing `localDiag`.
// NOTE(review): the signature and the definition of `localDiag` are not shown
// here; presumably `localDiag` is A's diagonal on the row map — confirm.
734template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
735RCP<Xpetra::Vector<Scalar, LocalOrdinal, GlobalOrdinal, Node>>
738 RCP<const Map> rowMap = A.getRowMap(), colMap = A.getColMap();
// Target vector on the column map.
740 RCP<Vector> diagonal = VectorFactory::Build(colMap);
// Reuse the graph's importer when it has one; otherwise build rowMap -> colMap.
741 RCP<const Import> importer = A.getCrsGraph()->getImporter();
742 if (importer == Teuchos::null) {
743 importer = ImportFactory::Build(rowMap, colMap);
745 diagonal->doImport(*localDiag, *(importer), Xpetra::INSERT);
// Computes a per-row quantity from the off-diagonal entries of A on the row
// map (`local`) and imports it into a column-map vector (`ghosted`).
// NOTE(review): the signature and the statements that accumulate and store the
// per-row value are not shown here; presumably a sum of off-diagonal values —
// confirm.
750template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
751RCP<Xpetra::Vector<Scalar, LocalOrdinal, GlobalOrdinal, Node>>
754 using STS =
typename Teuchos::ScalarTraits<SC>;
757 RCP<const Map> rowMap = A.getRowMap(), colMap = A.getColMap();
// If the row map is a BlockedMap, work with the map returned by getMap().
758 RCP<const BlockedMap> browMap = Teuchos::rcp_dynamic_cast<const BlockedMap>(rowMap);
759 if (!browMap.is_null()) rowMap = browMap->getMap();
// `local` holds the per-row result; `ghosted` (built with `true`) receives the import.
761 RCP<Vector> local = Xpetra::VectorFactory<SC, LO, GO, Node>::Build(rowMap);
762 RCP<Vector> ghosted = Xpetra::VectorFactory<SC, LO, GO, Node>::Build(colMap,
true);
763 ArrayRCP<SC> localVals = local->getDataNonConst(0);
// Host loop over the local rows of A.
765 for (LO row = 0; row < static_cast<LO>(A.getRowMap()->getLocalNumElements()); ++row) {
766 size_t nnz = A.getNumEntriesInLocalRow(row);
767 ArrayView<const LO> indices;
768 ArrayView<const SC> vals;
769 A.getLocalRowView(row, indices, vals);
773 for (LO colID = 0; colID < static_cast<LO>(nnz); colID++) {
// Entries whose local column index equals the local row index are skipped.
774 if (indices[colID] != row) {
// Reuse the graph's importer when it has one; otherwise build rowMap -> colMap.
781 RCP<const Xpetra::Import<LO, GO, Node>> importer;
782 importer = A.getCrsGraph()->getImporter();
783 if (importer == Teuchos::null) {
784 importer = Xpetra::ImportFactory<LO, GO, Node>::Build(rowMap, colMap);
786 ghosted->doImport(*local, *(importer), Xpetra::INSERT);
// For every local row of A, sums the magnitudes of the entries whose local
// column index differs from the local row index, stores the sum in a
// magnitude-typed vector on the row map, and imports that vector into one on
// the column map.
// NOTE(review): the signature, the return statement and the declaration of
// `si` are not shown here; `si` is presumably reset to zero per row — confirm.
790template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
794 RCP<const Map> rowMap = A.getRowMap(), colMap = A.getColMap();
795 using STS =
typename Teuchos::ScalarTraits<Scalar>;
796 using MTS =
typename Teuchos::ScalarTraits<Magnitude>;
// Vector type whose scalar is the magnitude type MT.
798 using RealValuedVector = Xpetra::Vector<MT, LO, GO, Node>;
// If the row map is a BlockedMap, work with the map returned by getMap().
801 RCP<const BlockedMap> browMap = Teuchos::rcp_dynamic_cast<const BlockedMap>(rowMap);
802 if (!browMap.is_null()) rowMap = browMap->getMap();
// `local` holds the per-row sums; `ghosted` (built with `true`) receives the import.
804 RCP<RealValuedVector> local = Xpetra::VectorFactory<MT, LO, GO, Node>::Build(rowMap);
805 RCP<RealValuedVector> ghosted = Xpetra::VectorFactory<MT, LO, GO, Node>::Build(colMap,
true);
806 ArrayRCP<MT> localVals = local->getDataNonConst(0);
// Host loop over the local rows of A.
808 for (LO rowIdx = 0; rowIdx < static_cast<LO>(A.getRowMap()->getLocalNumElements()); ++rowIdx) {
809 size_t nnz = A.getNumEntriesInLocalRow(rowIdx);
810 ArrayView<const LO> indices;
811 ArrayView<const SC> vals;
812 A.getLocalRowView(rowIdx, indices, vals);
816 for (LO colID = 0; colID < static_cast<LO>(nnz); ++colID) {
// Accumulate |a_ij| for off-diagonal entries only.
817 if (indices[colID] != rowIdx) {
818 si += STS::magnitude(vals[colID]);
821 localVals[rowIdx] = si;
// Reuse the graph's importer when it has one; otherwise build rowMap -> colMap.
824 RCP<const Xpetra::Import<LO, GO, Node>> importer;
825 importer = A.getCrsGraph()->getImporter();
826 if (importer == Teuchos::null) {
827 importer = Xpetra::ImportFactory<LO, GO, Node>::Build(rowMap, colMap);
829 ghosted->doImport(*local, *(importer), Xpetra::INSERT);
// Computes the residual multivector for (Op, X, RHS) via Residual() and
// prepares one norm slot per column.
//
// Op  - operator.
// X   - solution multivector.
// RHS - right-hand-side multivector; must have as many columns as X,
//       otherwise Exceptions::RuntimeError is thrown.
// NOTE(review): the statements that fill and return `norms` are not shown
// here; presumably a per-column norm of RES — confirm.
833template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
834Teuchos::Array<typename Teuchos::ScalarTraits<Scalar>::magnitudeType>
836 ResidualNorm(
const Xpetra::Operator<Scalar, LocalOrdinal, GlobalOrdinal, Node>& Op,
const MultiVector& X,
const MultiVector& RHS) {
// NOTE(review): no ';' follows the macro call; this relies on the macro
// expanding to a complete statement — confirm.
837 TEUCHOS_TEST_FOR_EXCEPTION(X.getNumVectors() != RHS.getNumVectors(),
Exceptions::RuntimeError,
"Number of solution vectors != number of right-hand sides")
838 const size_t numVecs = X.getNumVectors();
// Residual is allocated and computed by the three-argument Residual().
839 RCP<MultiVector> RES =
Residual(Op, X, RHS);
840 Teuchos::Array<Magnitude> norms(numVecs);
// Overload of ResidualNorm that takes a caller-provided multivector `Resid`.
//
// Op    - operator.
// X     - solution multivector.
// RHS   - right-hand-side multivector; must have as many columns as X,
//         otherwise Exceptions::RuntimeError is thrown.
// Resid - caller-provided multivector (how it is used is not shown here;
//         presumably it receives the residual — confirm).
// NOTE(review): the statements that compute the residual and fill/return
// `norms` are not shown here.
845template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
846Teuchos::Array<typename Teuchos::ScalarTraits<Scalar>::magnitudeType>
848 ResidualNorm(
const Xpetra::Operator<Scalar, LocalOrdinal, GlobalOrdinal, Node>& Op,
const MultiVector& X,
const MultiVector& RHS, MultiVector& Resid) {
// NOTE(review): no ';' follows the macro call; this relies on the macro
// expanding to a complete statement — confirm.
849 TEUCHOS_TEST_FOR_EXCEPTION(X.getNumVectors() != RHS.getNumVectors(),
Exceptions::RuntimeError,
"Number of solution vectors != number of right-hand sides")
850 const size_t numVecs = X.getNumVectors();
// One norm slot per column of X.
852 Teuchos::Array<Magnitude> norms(numVecs);
// Allocates a multivector on RHS's map with as many columns as X and lets the
// operator fill it through Op.residual(X, RHS, *RES).
//
// Op  - operator providing residual().
// X   - solution multivector.
// RHS - right-hand-side multivector; must have as many columns as X,
//       otherwise Exceptions::RuntimeError is thrown.
// NOTE(review): the return statement is not shown here; presumably RES.
857template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
858RCP<Xpetra::MultiVector<Scalar, LocalOrdinal, GlobalOrdinal, Node>>
860 Residual(
const Xpetra::Operator<Scalar, LocalOrdinal, GlobalOrdinal, Node>& Op,
const MultiVector& X,
const MultiVector& RHS) {
// NOTE(review): no ';' follows the macro call; this relies on the macro
// expanding to a complete statement — confirm.
861 TEUCHOS_TEST_FOR_EXCEPTION(X.getNumVectors() != RHS.getNumVectors(),
Exceptions::RuntimeError,
"Number of solution vectors != number of right-hand sides")
862 const size_t numVecs = X.getNumVectors();
// Built with the `false` flag (presumably no zero-fill — TODO confirm);
// Op.residual is expected to write every entry.
864 RCP<MultiVector> RES = Xpetra::MultiVectorFactory<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Build(RHS.getMap(), numVecs,
false);
865 Op.residual(X, RHS, *RES);
// Computes the residual into a caller-provided multivector by forwarding to
// Op.residual(X, RHS, Resid).
//
// Op    - operator providing residual().
// X     - solution multivector.
// RHS   - right-hand-side multivector.
// Resid - output multivector.
// Throws Exceptions::RuntimeError when X or Resid does not have the same
// number of columns as RHS.
869template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
871 Residual(
const Xpetra::Operator<Scalar, LocalOrdinal, GlobalOrdinal, Node>& Op,
const MultiVector& X,
const MultiVector& RHS, MultiVector& Resid) {
872 TEUCHOS_TEST_FOR_EXCEPTION(X.getNumVectors() != RHS.getNumVectors(),
Exceptions::RuntimeError,
"Number of solution vectors != number of right-hand sides");
873 TEUCHOS_TEST_FOR_EXCEPTION(Resid.getNumVectors() != RHS.getNumVectors(),
Exceptions::RuntimeError,
"Number of residual vectors != number of right-hand sides");
874 Op.residual(X, RHS, Resid);
// Convenience entry point that optionally builds the inverse diagonal of A and
// delegates to the PowerMethod overload that takes `diagInvVec`.
// NOTE(review): the leading part of the signature, the condition guarding the
// GetMatrixDiagonalInverse call and the return statement are not shown here.
877template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
881 LocalOrdinal niters,
typename Teuchos::ScalarTraits<Scalar>::magnitudeType tolerance,
bool verbose,
unsigned int seed) {
// Message of a check whose condition is not shown here.
883 "Utils::PowerMethod: operator must have domain and range maps that are equivalent.");
// Stays null unless the assignment below executes; the callee tests for null.
886 RCP<Vector> diagInvVec;
888 diagInvVec = GetMatrixDiagonalInverse(A);
// All remaining arguments are forwarded unchanged.
891 Scalar lambda = PowerMethod(A, diagInvVec, niters, tolerance, verbose, seed);
// Iterative eigenvalue estimate for A, optionally scaled entry-wise by
// `diagInvVec`.
//
// A          - matrix.
// diagInvVec - if non-null, z is multiplied entry-wise by this vector.
// niters     - maximum number of iterations.
// tolerance  - the residual is compared against this value.
// verbose    - presumably enables the progress output below (the guarding
//              condition is not shown here).
// seed       - not used in the lines shown here; presumably seeds the random
//              start vector — confirm.
// NOTE(review): the initialisation of z, the operator application, the update
// of `lambda` and the norm computations are not shown here.
895template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
898 PowerMethod(
const Matrix& A,
const RCP<Vector>& diagInvVec,
899 LocalOrdinal niters,
typename Teuchos::ScalarTraits<Scalar>::magnitudeType tolerance,
bool verbose,
unsigned int seed) {
// Message of a check whose condition is not shown here.
901 "Utils::PowerMethod: operator must have domain and range maps that are equivalent.");
// Work vectors: q on the domain map, r and z on the range map.
904 RCP<Vector> q = Xpetra::VectorFactory<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Build(A.getDomainMap());
905 RCP<Vector> r = Xpetra::VectorFactory<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Build(A.getRangeMap());
906 RCP<Vector> z = Xpetra::VectorFactory<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Build(A.getRangeMap());
911 Teuchos::Array<Magnitude> norms(1);
913 typedef Teuchos::ScalarTraits<Scalar> STS;
915 const Scalar zero = STS::zero(), one = STS::one();
918 Magnitude residual = STS::magnitude(zero);
921 for (
int iter = 0; iter < niters; ++iter) {
// q <- z / norms[0]; norms[0] is presumably the current norm of z.
923 q->update(one / norms[0], *z, zero);
// Optional entry-wise scaling of z by the supplied vector.
925 if (diagInvVec != Teuchos::null)
926 z->elementWiseMultiply(one, *diagInvVec, *z, zero);
// The residual check runs every 100th iteration and on the last one.
929 if (iter % 100 == 0 || iter + 1 == niters) {
// r <- z - lambda * q.
930 r->update(1.0, *z, -lambda, *q, zero);
// NOTE(review): divides by lambda with no visible guard against zero.
932 residual = STS::magnitude(norms[0] / lambda);
934 std::cout <<
"Iter = " << iter
935 <<
" Lambda = " << lambda
936 <<
" Residual of A*q - lambda*q = " << residual
// Convergence test; the action taken is not shown here (presumably `break`).
940 if (residual < tolerance)
// Wraps the stream `os` in a Teuchos::FancyOStream through a non-owning
// reference (rcpFromRef).
// NOTE(review): the signature and the return statement are not shown here;
// presumably `fancy` is returned. The caller must keep `os` alive while the
// result is in use — confirm.
946template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
947RCP<Teuchos::FancyOStream>
950 RCP<Teuchos::FancyOStream> fancy = Teuchos::fancyOStream(Teuchos::rcpFromRef(os));
// Returns the magnitude of sum_j (v[j][i0] - v[j][i1])^2 over all arrays in v.
// No square root is taken.
// NOTE(review): the signature is not shown here (v, i0 and i1 are declared
// there). The difference is multiplied by itself rather than by its
// conjugate; for a complex Scalar this is not the squared modulus — confirm
// this is intended.
954template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
955typename Teuchos::ScalarTraits<Scalar>::magnitudeType
958 const size_t numVectors = v.size();
// Accumulate in Scalar, convert to a magnitude only at the end.
960 Scalar d = Teuchos::ScalarTraits<Scalar>::zero();
961 for (
size_t j = 0; j < numVectors; j++) {
962 d += (v[j][i0] - v[j][i1]) * (v[j][i0] - v[j][i1]);
964 return Teuchos::ScalarTraits<Scalar>::magnitude(d);
// Weighted variant: returns the magnitude of
// sum_j weight[j] * (v[j][i0] - v[j][i1])^2 over all arrays in v.
// No square root is taken.
// NOTE(review): the signature is not shown here (weight, v, i0 and i1 are
// declared there); `weight` presumably has at least v.size() entries —
// confirm.
967template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
968typename Teuchos::ScalarTraits<Scalar>::magnitudeType
971 const size_t numVectors = v.size();
972 using MT =
typename Teuchos::ScalarTraits<Scalar>::magnitudeType;
// Accumulate in Scalar, convert to a magnitude only at the end.
974 Scalar d = Teuchos::ScalarTraits<Scalar>::zero();
975 for (
size_t j = 0; j < numVectors; j++) {
// Each weight is converted to the magnitude type before multiplying.
976 d += Teuchos::as<MT>(weight[j]) * (v[j][i0] - v[j][i1]) * (v[j][i0] - v[j][i1]);
978 return Teuchos::ScalarTraits<Scalar>::magnitude(d);
// Host-side detection of Dirichlet rows of A. Returns one flag per local row;
// every flag starts as true.
//
// A                       - matrix to inspect.
// tol                     - an off-diagonal entry counts as significant when
//                           its magnitude exceeds tol.
// count_twos_as_dirichlet - selects the first branch below, which also tracks
//                           whether a row was already cleared.
// NOTE(review): the definition of numRows, both row-loop headers and several
// statements inside the first branch are not shown here.
981template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
982Teuchos::ArrayRCP<const bool>
984 DetectDirichletRows(
const Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>& A,
const typename Teuchos::ScalarTraits<Scalar>::magnitudeType& tol,
bool count_twos_as_dirichlet) {
986 typedef Teuchos::ScalarTraits<Scalar> STS;
987 ArrayRCP<bool> boundaryNodes(numRows,
true);
988 if (count_twos_as_dirichlet) {
990 ArrayView<const LocalOrdinal> indices;
991 ArrayView<const Scalar> vals;
992 A.getLocalRowView(row, indices, vals);
993 size_t nnz = A.getNumEntriesInLocalRow(row);
// `col` is declared outside the loop header (declaration not shown here),
// presumably so it can be inspected after the loop.
996 for (col = 0; col < nnz; col++)
997 if ((indices[col] != row) && STS::magnitude(vals[col]) > tol) {
// Flag already cleared: a significant off-diagonal was seen before. The
// action taken is not shown here (presumably `break`).
998 if (!boundaryNodes[row])
1000 boundaryNodes[row] =
false;
// Executed under a condition not shown here.
1003 boundaryNodes[row] =
true;
// Second branch: any significant off-diagonal entry clears the flag.
1008 ArrayView<const LocalOrdinal> indices;
1009 ArrayView<const Scalar> vals;
1010 A.getLocalRowView(row, indices, vals);
1011 size_t nnz = A.getNumEntriesInLocalRow(row);
1013 for (
size_t col = 0; col < nnz; col++)
1014 if ((indices[col] != row) && STS::magnitude(vals[col]) > tol) {
1015 boundaryNodes[row] =
false;
1020 return boundaryNodes;
// Kokkos detection of Dirichlet rows. Returns a bool view in `memory_space`
// with one flag per local row (per block row for a Tpetra BlockCrs matrix).
//
// tol                     - an off-diagonal value counts as significant when
//                           its magnitude exceeds tol.
// count_twos_as_dirichlet - selects the kernel that also tracks whether a row
//                           was already cleared.
// NOTE(review): the function name, the matrix parameter and several `else`,
// `break` and closing lines are not shown here.
1023template <
class SC,
class LO,
class GO,
class NO,
class memory_space>
1024Kokkos::View<bool*, memory_space>
1026 const typename Teuchos::ScalarTraits<SC>::magnitudeType& tol,
1027 const bool count_twos_as_dirichlet) {
1028 using impl_scalar_type =
typename Kokkos::ArithTraits<SC>::val_type;
1029 using ATS = Kokkos::ArithTraits<impl_scalar_type>;
1030 using range_type = Kokkos::RangePolicy<LO, typename NO::execution_space>;
1031 using helpers = Xpetra::Helpers<SC, LO, GO, NO>;
// Flags are computed in the node's device memory space first.
1033 Kokkos::View<bool*, typename NO::device_type::memory_space> boundaryNodes;
// --- Block CRS path: one flag per block row. ---
1035 if (helpers::isTpetraBlockCrs(A)) {
1036 const Tpetra::BlockCrsMatrix<SC, LO, GO, NO>& Am = toTpetraBlock(A);
1037 auto b_graph = Am.getCrsGraph().getLocalGraphDevice();
1038 auto b_rowptr = Am.getCrsGraph().getLocalRowPtrsDevice();
1039 auto values = Am.getValuesDevice();
1040 LO numBlockRows = Am.getLocalNumRows();
// Number of scalar values stored per block.
1041 const LO stride = Am.getBlockSize() * Am.getBlockSize();
// Allocated without initialisation; the kernel writes every entry.
1043 boundaryNodes = Kokkos::View<bool*, typename NO::device_type::memory_space>(Kokkos::ViewAllocateWithoutInitializing(
"boundaryNodes"), numBlockRows);
// The statement controlled by this condition is not shown here.
1045 if (count_twos_as_dirichlet)
1048 Kokkos::parallel_for(
1049 "MueLu:Utils::DetectDirichletRowsBlockCrs", range_type(0, numBlockRows),
1050 KOKKOS_LAMBDA(
const LO row) {
1051 auto rowView = b_graph.rowConst(row);
1052 auto length = rowView.length;
// Offset of the first scalar value belonging to this block row.
1053 LO valstart = b_rowptr[row] * stride;
1055 boundaryNodes(row) =
true;
1056 decltype(length) colID = 0;
1057 for (; colID < length; colID++) {
// Off-diagonal block: scan all `stride` scalars of the block.
1058 if (rowView.colidx(colID) != row) {
1059 LO current = valstart + colID * stride;
1060 for (LO k = 0; k < stride; k++) {
1061 if (ATS::magnitude(values[current + k]) > tol) {
1062 boundaryNodes(row) =
false;
// The action taken is not shown here (presumably an early exit).
1067 if (boundaryNodes(row) ==
false)
// --- Point CRS path: one flag per local row. ---
1072 auto localMatrix = A.getLocalMatrixDevice();
1073 LO numRows = A.getLocalNumRows();
1074 boundaryNodes = Kokkos::View<bool*, typename NO::device_type::memory_space>(Kokkos::ViewAllocateWithoutInitializing(
"boundaryNodes"), numRows);
1076 if (count_twos_as_dirichlet)
1077 Kokkos::parallel_for(
1078 "MueLu:Utils::DetectDirichletRows_Twos_As_Dirichlet", range_type(0, numRows),
1079 KOKKOS_LAMBDA(
const LO row) {
1080 auto rowView = localMatrix.row(row);
1081 auto length = rowView.length;
1083 boundaryNodes(row) =
true;
// colID is declared outside the loop so it can be checked afterwards.
1085 decltype(length) colID = 0;
1086 for (; colID < length; colID++)
1087 if ((rowView.colidx(colID) != row) &&
1088 (ATS::magnitude(rowView.value(colID)) > tol)) {
// Flag already cleared: a significant off-diagonal was seen before. The
// action taken is not shown here (presumably `break`).
1089 if (!boundaryNodes(row))
1091 boundaryNodes(row) =
false;
// The loop ran to completion: the row is flagged again.
1093 if (colID == length)
1094 boundaryNodes(row) =
true;
// Default kernel: any significant off-diagonal entry clears the flag.
1098 Kokkos::parallel_for(
1099 "MueLu:Utils::DetectDirichletRows", range_type(0, numRows),
1100 KOKKOS_LAMBDA(
const LO row) {
1101 auto rowView = localMatrix.row(row);
1102 auto length = rowView.length;
1104 boundaryNodes(row) =
true;
1105 for (
decltype(length) colID = 0; colID < length; colID++)
1106 if ((rowView.colidx(colID) != row) &&
1107 (ATS::magnitude(rowView.value(colID)) > tol)) {
1108 boundaryNodes(row) =
false;
// Return directly when the requested memory space is the device's own;
// otherwise deep-copy into a view allocated in the requested space.
1113 if constexpr (std::is_same<memory_space, typename NO::device_type::memory_space>::value)
1114 return boundaryNodes;
1116 Kokkos::View<bool*, memory_space> boundaryNodes2(Kokkos::ViewAllocateWithoutInitializing(
"boundaryNodes"), boundaryNodes.extent(0));
1117 Kokkos::deep_copy(boundaryNodes2, boundaryNodes);
1118 return boundaryNodes2;
// Zero-length view; how it is used is not shown here (presumably a fallback
// return value).
1121 Kokkos::View<bool*, memory_space> dummy(
"dummy", 0);
// Overload returning the Dirichlet-row flags as a bool view in the node's
// device memory space.
// NOTE(review): the function name, the matrix parameter and the body are not
// shown here; presumably it forwards to the memory_space-templated
// implementation — confirm.
1125template <
class SC,
class LO,
class GO,
class NO>
1126Kokkos::View<bool*, typename NO::device_type::memory_space>
1129 const typename Teuchos::ScalarTraits<SC>::magnitudeType& tol,
1130 const bool count_twos_as_dirichlet) {
// Overload returning the Dirichlet-row flags as a bool view in
// Kokkos::HostSpace.
// NOTE(review): the function name, the matrix parameter and the body are not
// shown here; presumably it forwards to the memory_space-templated
// implementation — confirm.
1134template <
class SC,
class LO,
class GO,
class NO>
1135Kokkos::View<bool*, typename Kokkos::HostSpace>
1138 const typename Teuchos::ScalarTraits<SC>::magnitudeType& tol,
1139 const bool count_twos_as_dirichlet) {
// Dirichlet-row detection that scales each off-diagonal entry by the diagonal
// before comparing it with tol, and reports whether a row has no diagonal
// entry.
//
// A                - matrix to inspect.
// bHasZeroDiagonal - output; reset to false on entry and set to true where
//                    the `bHasDiag == false` check below fires.
// tol              - threshold applied to the scaled off-diagonal magnitude.
// NOTE(review): the definition of numRows, the row-loop header and the
// statements that update boundaryNodes / bHasDiag inside the loop are not
// shown here.
1143template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1144Teuchos::ArrayRCP<const bool>
1146 DetectDirichletRowsExt(
const Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>& A,
bool& bHasZeroDiagonal,
const typename Teuchos::ScalarTraits<Scalar>::magnitudeType& tol) {
1148 bHasZeroDiagonal =
false;
// Local copy of A's diagonal on the row map.
1150 Teuchos::RCP<Vector> diagVec = Xpetra::VectorFactory<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Build(A.getRowMap());
1151 A.getLocalDiagCopy(*diagVec);
1152 Teuchos::ArrayRCP<const Scalar> diagVecData = diagVec->getData(0);
1155 typedef Teuchos::ScalarTraits<Scalar> STS;
// All flags start as false.
1156 ArrayRCP<bool> boundaryNodes(numRows,
false);
1158 ArrayView<const LocalOrdinal> indices;
1159 ArrayView<const Scalar> vals;
1160 A.getLocalRowView(row, indices, vals);
1162 bool bHasDiag =
false;
1163 for (
decltype(indices.size()) col = 0; col < indices.size(); col++) {
1164 if (indices[col] != row) {
// Scaled test: |a_ij / sqrt(|d_row| * |d_*|)| > tol.
// NOTE(review): the second diagonal factor is read at `col`, the position
// inside the row, not at the column index indices[col] — confirm this is
// intended.
1165 if (STS::magnitude(vals[col] / STS::magnitude(sqrt(STS::magnitude(diagVecData[row]) * STS::magnitude(diagVecData[col])))) > tol) {
// No diagonal entry was recorded for this row.
1171 if (bHasDiag ==
false)
1172 bHasZeroDiagonal =
true;
// Executed under a condition not shown here.
1174 boundaryNodes[row] =
true;
1176 return boundaryNodes;
// Copies RHS into InitialGuess on the rows flagged in `dirichletRows`, for
// every column j.
//
// RHS                     - source multivector (read-only device view).
// InitialGuess            - multivector updated in place; must have the same
//                           number of columns as `numVectors` and a map
//                           compatible with RHS's map.
// tol, count_twos_as_dirichlet - not used in the lines shown here; presumably
//                           passed to the Dirichlet-row detection — confirm.
// NOTE(review): the function name, the matrix parameter and the definitions
// of numRows, numVectors and dirichletRows are not shown here; the kernel
// label suggests the name EnforceInitialCondition.
1179template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1182 const Xpetra::MultiVector<Scalar, LocalOrdinal, GlobalOrdinal, Node>& RHS,
1183 Xpetra::MultiVector<Scalar, LocalOrdinal, GlobalOrdinal, Node>& InitialGuess,
1184 const typename Teuchos::ScalarTraits<SC>::magnitudeType& tol,
1185 const bool count_twos_as_dirichlet) {
1186 using range_type = Kokkos::RangePolicy<LO, typename Node::execution_space>;
// Sanity checks: matching column count and compatible maps.
1192 TEUCHOS_ASSERT_EQUALITY(numVectors, Teuchos::as<LocalOrdinal>(InitialGuess.getNumVectors()));
1194 TEUCHOS_ASSERT(RHS.getMap()->isCompatible(InitialGuess.getMap()));
// RHS is only read; InitialGuess is requested with ReadWrite access.
1197 auto lclRHS = RHS.getDeviceLocalView(Xpetra::Access::ReadOnly);
1198 auto lclInitialGuess = InitialGuess.getDeviceLocalView(Xpetra::Access::ReadWrite);
1200 Kokkos::parallel_for(
1201 "MueLu:Utils::EnforceInitialCondition", range_type(0, numRows),
1202 KOKKOS_LAMBDA(
const LO row) {
// Only flagged rows are overwritten; the loop over j is not shown here.
1203 if (dirichletRows(row)) {
1205 lclInitialGuess(row, j) = lclRHS(row, j);
// Marks which entries of `vals` are numerically nonzero.
//
// vals     - input values.
// nonzeros - output flags; must have the same size as vals (asserted).
//            nonzeros[i] is true iff |vals[i]| > 2 * eps, where eps is the
//            machine epsilon of the magnitude type.
1210template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1212 FindNonZeros(
const Teuchos::ArrayRCP<const Scalar> vals,
1213 Teuchos::ArrayRCP<bool> nonzeros) {
1214 TEUCHOS_ASSERT(vals.size() == nonzeros.size());
1215 typedef typename Teuchos::ScalarTraits<Scalar>::magnitudeType magnitudeType;
// Threshold: twice the machine epsilon of the magnitude type.
1216 const magnitudeType eps = 2.0 * Teuchos::ScalarTraits<magnitudeType>::eps();
1217 for (
size_t i = 0; i < static_cast<size_t>(vals.size()); i++) {
1218 nonzeros[i] = (Teuchos::ScalarTraits<Scalar>::magnitude(vals[i]) > eps);
// Kokkos variant: marks which entries of column 0 of `vals` are numerically
// nonzero.
//
// vals     - device view of a multivector; only vals(i, 0) is read.
// nonzeros - output flags; extent(0) must match vals.extent(0) (asserted).
//            nonzeros(i) is true iff |vals(i, 0)| > 2 * impl_ATS::eps().
1223template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1225 FindNonZeros(
const typename Xpetra::MultiVector<Scalar, LocalOrdinal, GlobalOrdinal, Node>::dual_view_type::t_dev_const_um vals,
1226 Kokkos::View<bool*, typename Node::device_type> nonzeros) {
1227 using ATS = Kokkos::ArithTraits<Scalar>;
// Arithmetic traits of the implementation scalar type ATS::val_type.
1228 using impl_ATS = Kokkos::ArithTraits<typename ATS::val_type>;
1229 using range_type = Kokkos::RangePolicy<LocalOrdinal, typename Node::execution_space>;
1230 TEUCHOS_ASSERT(vals.extent(0) == nonzeros.extent(0));
// Threshold: twice the epsilon reported by impl_ATS.
1231 const typename ATS::magnitudeType eps = 2.0 * impl_ATS::eps();
// NOTE(review): the range policy is indexed by LocalOrdinal while the lambda
// takes size_t; presumably an implicit conversion — confirm.
1233 Kokkos::parallel_for(
1234 "MueLu:Maxwell1::FindNonZeros", range_type(0, vals.extent(0)),
1235 KOKKOS_LAMBDA(
const size_t i) {
1236 nonzeros(i) = (impl_ATS::magnitude(vals(i, 0)) > eps);
// Host-side propagation of Dirichlet rows to columns and domain entries.
//
// dirichletRows   - input flags, one per local row-map entry (asserted).
// dirichletCols   - output flags, one per local column-map entry (asserted).
// dirichletDomain - output flags, one per local domain-map entry (asserted);
//                   filled by FindNonZeros from the accumulated marker vector.
// NOTE(review): the function name, the matrix parameter and the statement
// that fills dirichletCols are not shown here.
1240template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1243 const Teuchos::ArrayRCP<bool>& dirichletRows,
1244 Teuchos::ArrayRCP<bool> dirichletCols,
1245 Teuchos::ArrayRCP<bool> dirichletDomain) {
1246 const Scalar one = Teuchos::ScalarTraits<Scalar>::one();
1247 RCP<const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>> domMap = A.getDomainMap();
1248 RCP<const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>> rowMap = A.getRowMap();
1249 RCP<const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>> colMap = A.getColMap();
// Each flag array must match the local size of its map.
1250 TEUCHOS_ASSERT(
static_cast<size_t>(dirichletRows.size()) == rowMap->getLocalNumElements());
1251 TEUCHOS_ASSERT(
static_cast<size_t>(dirichletCols.size()) == colMap->getLocalNumElements());
1252 TEUCHOS_ASSERT(
static_cast<size_t>(dirichletDomain.size()) == domMap->getLocalNumElements());
// Marker vector on the column map, built with the `true` flag.
1253 RCP<Xpetra::MultiVector<Scalar, LocalOrdinal, GlobalOrdinal, Node>> myColsToZero = Xpetra::MultiVectorFactory<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Build(colMap, 1,
true);
// Every column that appears in a Dirichlet row is marked with one.
1255 for (
size_t i = 0; i < (size_t)dirichletRows.size(); i++) {
1256 if (dirichletRows[i]) {
1257 ArrayView<const LocalOrdinal> indices;
1258 ArrayView<const Scalar> values;
1259 A.getLocalRowView(i, indices, values);
1260 for (
size_t j = 0; j < static_cast<size_t>(indices.size()); j++)
1261 myColsToZero->replaceLocalValue(indices[j], 0, one);
1265 RCP<Xpetra::MultiVector<Scalar, LocalOrdinal, GlobalOrdinal, Node>> globalColsToZero;
1266 RCP<const Xpetra::Import<LocalOrdinal, GlobalOrdinal, Node>> importer = A.getCrsGraph()->getImporter();
// With an importer: export the markers to the domain map with ADD, then
// import the combined result back onto the column map.
1267 if (!importer.is_null()) {
1268 globalColsToZero = Xpetra::MultiVectorFactory<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Build(domMap, 1,
true);
1270 globalColsToZero->doExport(*myColsToZero, *importer, Xpetra::ADD);
1272 myColsToZero->doImport(*globalColsToZero, *importer, Xpetra::INSERT);
// Presumably the no-importer branch (the `else` line is not shown here).
1274 globalColsToZero = myColsToZero;
// Domain flags are the nonzero pattern of the domain-map marker vector.
1276 FindNonZeros(globalColsToZero->getData(0), dirichletDomain);
// Kokkos variant of the propagation of Dirichlet rows to columns and domain
// entries.
//
// dirichletRows   - input device flags, one per local row-map entry (asserted).
// dirichletCols   - output device flags, one per local column-map entry
//                   (asserted).
// dirichletDomain - output device flags, one per local domain-map entry
//                   (asserted).
// NOTE(review): the function name, the matrix parameter, the lambda header
// and the statements that fill dirichletCols / dirichletDomain are not shown
// here.
1280template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1283 const Kokkos::View<bool*, typename Node::device_type>& dirichletRows,
1284 Kokkos::View<bool*, typename Node::device_type> dirichletCols,
1285 Kokkos::View<bool*, typename Node::device_type> dirichletDomain) {
1286 using ATS = Kokkos::ArithTraits<Scalar>;
1287 using impl_ATS = Kokkos::ArithTraits<typename ATS::val_type>;
1288 using range_type = Kokkos::RangePolicy<LocalOrdinal, typename Node::execution_space>;
1289 RCP<const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>> domMap = A.getDomainMap();
1290 RCP<const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>> rowMap = A.getRowMap();
1291 RCP<const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>> colMap = A.getColMap();
// Each flag view must match the local size of its map.
1292 TEUCHOS_ASSERT(dirichletRows.extent(0) == rowMap->getLocalNumElements());
1293 TEUCHOS_ASSERT(dirichletCols.extent(0) == colMap->getLocalNumElements());
1294 TEUCHOS_ASSERT(dirichletDomain.extent(0) == domMap->getLocalNumElements());
// Marker vector on the column map, built with the `true` flag.
1295 RCP<Xpetra::Vector<Scalar, LocalOrdinal, GlobalOrdinal, Node>> myColsToZero = Xpetra::VectorFactory<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Build(colMap,
true);
1297 auto myColsToZeroView = myColsToZero->getDeviceLocalView(Xpetra::Access::ReadWrite);
1298 auto localMatrix = A.getLocalMatrixDevice();
// One work item per local row; every column of a Dirichlet row is set to one.
// Different rows may write the same column entry, but always the same value.
1299 Kokkos::parallel_for(
1300 "MueLu:Maxwell1::DetectDirichletCols", range_type(0, rowMap->getLocalNumElements()),
1302 if (dirichletRows(row)) {
1303 auto rowView = localMatrix.row(row);
1304 auto length = rowView.length;
1306 for (
decltype(length) colID = 0; colID < length; colID++)
1307 myColsToZeroView(rowView.colidx(colID), 0) = impl_ATS::one();
1311 RCP<Xpetra::Vector<Scalar, LocalOrdinal, GlobalOrdinal, Node>> globalColsToZero;
1312 RCP<const Xpetra::Import<LocalOrdinal, GlobalOrdinal, Node>> importer = A.getCrsGraph()->getImporter();
// With an importer: export the markers to the domain map with ADD, then
// import the combined result back onto the column map.
1313 if (!importer.is_null()) {
1314 globalColsToZero = Xpetra::VectorFactory<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Build(domMap,
true);
1316 globalColsToZero->doExport(*myColsToZero, *importer, Xpetra::ADD);
1318 myColsToZero->doImport(*globalColsToZero, *importer, Xpetra::INSERT);
// Presumably the no-importer branch (the `else` line is not shown here).
1320 globalColsToZero = myColsToZero;
// Flags additional Dirichlet rows with a row-sum test.
//
// A             - matrix to inspect.
// rowSumTol     - the test is active only when rowSumTol < 1; a row is
//                 flagged when |rowsum| > |diagval| * rowSumTol.
// dirichletRows - in/out flags; only ever set to true in the lines shown here.
// NOTE(review): the condition selecting the diagonal entry is not shown here;
// presumably column index == row — confirm.
1325template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1327 ApplyRowSumCriterion(
const Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>& A,
const typename Teuchos::ScalarTraits<Scalar>::magnitudeType rowSumTol, Teuchos::ArrayRCP<bool>& dirichletRows) {
1328 typedef Teuchos::ScalarTraits<Scalar> STS;
1329 typedef typename Teuchos::ScalarTraits<Scalar>::magnitudeType MT;
1330 typedef Teuchos::ScalarTraits<MT> MTS;
1331 RCP<const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>> rowmap = A.getRowMap();
// Host loop over the local rows.
1332 for (
LocalOrdinal row = 0; row < Teuchos::as<LocalOrdinal>(rowmap->getLocalNumElements()); ++row) {
1333 size_t nnz = A.getNumEntriesInLocalRow(row);
1334 ArrayView<const LocalOrdinal> indices;
1335 ArrayView<const Scalar> vals;
1336 A.getLocalRowView(row, indices, vals);
// rowsum accumulates every entry of the row; diagval remembers one entry.
1338 Scalar rowsum = STS::zero();
1339 Scalar diagval = STS::zero();
1341 for (
LocalOrdinal colID = 0; colID < Teuchos::as<LocalOrdinal>(nnz); colID++) {
1344 diagval = vals[colID];
1345 rowsum += vals[colID];
// Row-sum test, disabled when rowSumTol >= 1.
1348 if (rowSumTol < MTS::one() && STS::magnitude(rowsum) > STS::magnitude(diagval) * rowSumTol) {
1350 dirichletRows[row] =
true;
// Block-aware row-sum test: only entries whose column belongs to the same
// block as the row contribute to the row sum.
//
// A             - matrix to inspect.
// BlockNumber   - block id per column-map entry; its map must be the same as
//                 A's column map, otherwise std::runtime_error is thrown.
// rowSumTol     - the test is active only when rowSumTol < 1; a row is
//                 flagged when |rowsum| > |diagval| * rowSumTol.
// dirichletRows - in/out flags; only ever set to true in the lines shown here.
// NOTE(review): the definition of `col` and the condition selecting the
// diagonal entry are not shown here; presumably col = indices[colID] and the
// condition is col == row — confirm.
1355template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1357 ApplyRowSumCriterion(
const Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>& A,
const Xpetra::Vector<LocalOrdinal, LocalOrdinal, GlobalOrdinal, Node>& BlockNumber,
const typename Teuchos::ScalarTraits<Scalar>::magnitudeType rowSumTol, Teuchos::ArrayRCP<bool>& dirichletRows) {
1358 typedef Teuchos::ScalarTraits<Scalar> STS;
1359 typedef typename Teuchos::ScalarTraits<Scalar>::magnitudeType MT;
1360 typedef Teuchos::ScalarTraits<MT> MTS;
1361 RCP<const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>> rowmap = A.getRowMap();
// NOTE(review): the message text reads "must match's A's" — likely a typo.
1363 TEUCHOS_TEST_FOR_EXCEPTION(!A.getColMap()->isSameAs(*BlockNumber.getMap()), std::runtime_error,
"ApplyRowSumCriterion: BlockNumber must match's A's column map.");
// Host view of the block ids (column 0).
1365 Teuchos::ArrayRCP<const LocalOrdinal> block_id = BlockNumber.getData(0);
1366 for (
LocalOrdinal row = 0; row < Teuchos::as<LocalOrdinal>(rowmap->getLocalNumElements()); ++row) {
1367 size_t nnz = A.getNumEntriesInLocalRow(row);
1368 ArrayView<const LocalOrdinal> indices;
1369 ArrayView<const Scalar> vals;
1370 A.getLocalRowView(row, indices, vals);
1372 Scalar rowsum = STS::zero();
1373 Scalar diagval = STS::zero();
1374 for (
LocalOrdinal colID = 0; colID < Teuchos::as<LocalOrdinal>(nnz); colID++) {
1377 diagval = vals[colID];
// Only same-block entries are summed. NOTE(review): block_id lives on the
// column map but is also looked up with the local row index — confirm the
// local indices coincide.
1378 if (block_id[row] == block_id[col])
1379 rowsum += vals[colID];
// Row-sum test, disabled when rowSumTol >= 1.
1383 if (rowSumTol < MTS::one() && STS::magnitude(rowsum) > STS::magnitude(diagval) * rowSumTol) {
1385 dirichletRows[row] =
true;
// Row-sum criterion for flags stored in a Kokkos::View of arbitrary memory space.
// The flags are copied into a host mirror, updated row by row on the host, and
// copied back into dirichletRows at the end.
// A row is flagged when STS::real(rowsum) > |diagval| * rowSumTol; this uses the
// real part of the row sum (not its magnitude), and no rowSumTol < 1 guard is
// visible here.
// NOTE(review): the line carrying the function name and the matrix parameter A
// is not visible in this excerpt.
1391template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node,
class memory_space>
1393 const typename Teuchos::ScalarTraits<Scalar>::magnitudeType rowSumTol,
1394 Kokkos::View<bool*, memory_space>& dirichletRows) {
1395 typedef Teuchos::ScalarTraits<Scalar> STS;
1396 RCP<const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>> rowmap = A.getRowMap();
// Work on a host copy of the flags so existing entries are preserved.
1398 auto dirichletRowsHost = Kokkos::create_mirror_view(dirichletRows);
1399 Kokkos::deep_copy(dirichletRowsHost, dirichletRows);
1401 for (
LocalOrdinal row = 0; row < Teuchos::as<LocalOrdinal>(rowmap->getLocalNumElements()); ++row) {
1402 size_t nnz = A.getNumEntriesInLocalRow(row);
1403 ArrayView<const LocalOrdinal> indices;
1404 ArrayView<const Scalar> vals;
1405 A.getLocalRowView(row, indices, vals);
1407 Scalar rowsum = STS::zero();
1408 Scalar diagval = STS::zero();
1409 for (
LocalOrdinal colID = 0; colID < Teuchos::as<LocalOrdinal>(nnz); colID++) {
// NOTE(review): the condition guarding the diagonal assignment is not visible
// in this excerpt - presumably a row == column check; confirm.
1412 diagval = vals[colID];
1413 rowsum += vals[colID];
1415 if (STS::real(rowsum) > STS::magnitude(diagval) * rowSumTol)
1416 dirichletRowsHost(row) =
true;
// Publish the updated flags back to the caller's view.
1419 Kokkos::deep_copy(dirichletRows, dirichletRowsHost);
// Overload taking the row flags as a Kokkos::View in Node's device memory space.
// NOTE(review): only part of the signature is visible in this excerpt; the
// function name line and the body are missing here.
1422template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1425 const typename Teuchos::ScalarTraits<Scalar>::magnitudeType rowSumTol,
1426 Kokkos::View<bool*, typename Node::device_type::memory_space>& dirichletRows) {
// Overload taking the row flags as a Kokkos::View in Kokkos::HostSpace.
// NOTE(review): only part of the signature is visible in this excerpt; the
// function name line and the body are missing here.
1430template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1433 const typename Teuchos::ScalarTraits<Scalar>::magnitudeType rowSumTol,
1434 Kokkos::View<bool*, Kokkos::HostSpace>& dirichletRows) {
// Block-aware row-sum criterion for flags stored in a Kokkos::View of arbitrary
// memory space. The flags are copied into a host mirror, updated on the host,
// and copied back into dirichletRows at the end.
// rowsum only accumulates entries with block_id[row] == block_id[col]; a row is
// flagged when STS::real(rowsum) > |diagval| * rowSumTol.
// Throws std::runtime_error when A's column map and BlockNumber's map differ.
// NOTE(review): the line carrying the function name and the matrix parameter A
// is not visible in this excerpt.
1439template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node,
class memory_space>
1441 const Xpetra::Vector<LocalOrdinal, LocalOrdinal, GlobalOrdinal, Node>& BlockNumber,
1442 const typename Teuchos::ScalarTraits<Scalar>::magnitudeType rowSumTol,
1443 Kokkos::View<bool*, memory_space>& dirichletRows) {
1444 typedef Teuchos::ScalarTraits<Scalar> STS;
1445 RCP<const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>> rowmap = A.getRowMap();
1447 TEUCHOS_TEST_FOR_EXCEPTION(!A.getColMap()->isSameAs(*BlockNumber.getMap()), std::runtime_error,
"ApplyRowSumCriterion: BlockNumber must match's A's column map.");
// Work on a host copy of the flags so existing entries are preserved.
1449 auto dirichletRowsHost = Kokkos::create_mirror_view(dirichletRows);
1450 Kokkos::deep_copy(dirichletRowsHost, dirichletRows);
1452 Teuchos::ArrayRCP<const LocalOrdinal> block_id = BlockNumber.getData(0);
1453 for (
LocalOrdinal row = 0; row < Teuchos::as<LocalOrdinal>(rowmap->getLocalNumElements()); ++row) {
1454 size_t nnz = A.getNumEntriesInLocalRow(row);
1455 ArrayView<const LocalOrdinal> indices;
1456 ArrayView<const Scalar> vals;
1457 A.getLocalRowView(row, indices, vals);
1459 Scalar rowsum = STS::zero();
1460 Scalar diagval = STS::zero();
1461 for (
LocalOrdinal colID = 0; colID < Teuchos::as<LocalOrdinal>(nnz); colID++) {
// NOTE(review): the declaration of `col` and the condition guarding the
// diagonal assignment are not visible in this excerpt - confirm.
1464 diagval = vals[colID];
// Only entries in the same block as the row contribute to the row sum.
1465 if (block_id[row] == block_id[col])
1466 rowsum += vals[colID];
1468 if (STS::real(rowsum) > STS::magnitude(diagval) * rowSumTol)
1469 dirichletRowsHost(row) =
true;
// Publish the updated flags back to the caller's view.
1472 Kokkos::deep_copy(dirichletRows, dirichletRowsHost);
// Block-aware overload taking the row flags as a Kokkos::View in Node's device
// memory space.
// NOTE(review): only part of the signature is visible in this excerpt; the
// function name line and the body are missing here.
1475template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1478 const Xpetra::Vector<LocalOrdinal, LocalOrdinal, GlobalOrdinal, Node>& BlockNumber,
1479 const typename Teuchos::ScalarTraits<Scalar>::magnitudeType rowSumTol,
1480 Kokkos::View<bool*, typename Node::device_type::memory_space>& dirichletRows) {
// Block-aware overload taking the row flags as a Kokkos::View in
// Kokkos::HostSpace.
// NOTE(review): only part of the signature is visible in this excerpt; the
// function name line and the body are missing here.
1484template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1487 const Xpetra::Vector<LocalOrdinal, LocalOrdinal, GlobalOrdinal, Node>& BlockNumber,
1488 const typename Teuchos::ScalarTraits<Scalar>::magnitudeType rowSumTol,
1489 Kokkos::View<bool*, Kokkos::HostSpace>& dirichletRows) {
// Builds per-column boolean flags (one per local column-map entry) from a set
// of flagged rows.
// Steps visible here:
//   1. Write `one` into a column-map multivector for every column index that
//      occurs in a row flagged in dirichletRows.
//   2. Export that vector to the domain map with Xpetra::ADD, then import it
//      back onto the column map with Xpetra::INSERT (same exporter object).
//   3. Flag a column when the magnitude of its value exceeds 2 * eps.
// Returns the resulting ArrayRCP<bool>.
// NOTE(review): the line carrying the function name and the matrix parameter A
// is not visible in this excerpt.
1493template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1494Teuchos::ArrayRCP<const bool>
1497 const Teuchos::ArrayRCP<const bool>& dirichletRows) {
1498 Scalar zero = Teuchos::ScalarTraits<Scalar>::zero();
1499 Scalar one = Teuchos::ScalarTraits<Scalar>::one();
1500 Teuchos::RCP<const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>> domMap = A.getDomainMap();
1501 Teuchos::RCP<const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>> colMap = A.getColMap();
1502 Teuchos::RCP<Xpetra::MultiVector<Scalar, LocalOrdinal, GlobalOrdinal, Node>> myColsToZero = Xpetra::MultiVectorFactory<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Build(colMap, 1);
1503 myColsToZero->putScalar(zero);
// Mark every column touched by a flagged row.
1505 for (
size_t i = 0; i < (size_t)dirichletRows.size(); i++) {
1506 if (dirichletRows[i]) {
1507 Teuchos::ArrayView<const LocalOrdinal> indices;
1508 Teuchos::ArrayView<const Scalar> values;
1509 A.getLocalRowView(i, indices, values);
1510 for (
size_t j = 0; j < static_cast<size_t>(indices.size()); j++)
1511 myColsToZero->replaceLocalValue(indices[j], 0, one);
1515 Teuchos::RCP<Xpetra::MultiVector<Scalar, LocalOrdinal, GlobalOrdinal, Node>> globalColsToZero = Xpetra::MultiVectorFactory<Scalar, LocalOrdinal, GlobalOrdinal, Node>::Build(domMap, 1);
1516 globalColsToZero->putScalar(zero);
1517 Teuchos::RCP<Xpetra::Export<LocalOrdinal, GlobalOrdinal, Node>> exporter = Xpetra::ExportFactory<LocalOrdinal, GlobalOrdinal, Node>::Build(colMap, domMap);
// Sum the column-map marks into the domain map ...
1519 globalColsToZero->doExport(*myColsToZero, *exporter, Xpetra::ADD);
// ... and bring the combined values back to the column map.
1521 myColsToZero->doImport(*globalColsToZero, *exporter, Xpetra::INSERT);
1522 Teuchos::ArrayRCP<const Scalar> myCols = myColsToZero->getData(0);
// Initial fill value is overwritten for every entry by the loop below.
1523 Teuchos::ArrayRCP<bool> dirichletCols(colMap->getLocalNumElements(),
true);
1524 Magnitude eps = Teuchos::ScalarTraits<Magnitude>::eps();
1525 for (
size_t i = 0; i < colMap->getLocalNumElements(); i++) {
1526 dirichletCols[i] = Teuchos::ScalarTraits<Scalar>::magnitude(myCols[i]) > 2.0 * eps;
1528 return dirichletCols;
// Kokkos variant: builds per-column boolean flags (one per local column-map
// entry) from a Kokkos::View of flagged rows.
// Steps visible here:
//   1. In a parallel_for over local rows, write one() into a column-map
//      multivector for every column index of a flagged row.
//   2. Export that vector to the domain map with Xpetra::ADD, then import it
//      back onto the column map with Xpetra::INSERT (same exporter object).
//   3. In a second parallel_for, flag a column when the magnitude of its value
//      exceeds eps, where eps is 2 * ATS::eps().
// Returns the resulting view, allocated without initialization and fully
// written by step 3.
// NOTE(review): the line carrying the function name and the matrix parameter A
// is not visible in this excerpt.
1531template <
class SC,
class LO,
class GO,
class NO>
1532Kokkos::View<bool*, typename NO::device_type>
1535 const Kokkos::View<const bool*, typename NO::device_type>& dirichletRows) {
1536 using ATS = Kokkos::ArithTraits<SC>;
1537 using impl_ATS = Kokkos::ArithTraits<typename ATS::val_type>;
1538 using range_type = Kokkos::RangePolicy<LO, typename NO::execution_space>;
1540 SC zero = ATS::zero();
1542 auto localMatrix = A.getLocalMatrixDevice();
1543 LO numRows = A.getLocalNumRows();
1545 Teuchos::RCP<const Xpetra::Map<LO, GO, NO>> domMap = A.getDomainMap();
1546 Teuchos::RCP<const Xpetra::Map<LO, GO, NO>> colMap = A.getColMap();
1547 Teuchos::RCP<Xpetra::MultiVector<SC, LO, GO, NO>> myColsToZero = Xpetra::MultiVectorFactory<SC, LO, GO, NO>::Build(colMap, 1);
1548 myColsToZero->putScalar(zero);
1549 auto myColsToZeroView = myColsToZero->getDeviceLocalView(Xpetra::Access::ReadWrite);
// Mark every column touched by a flagged row. Several rows may write the same
// column entry, but they all write the same value.
1551 Kokkos::parallel_for(
1552 "MueLu:Utils::DetectDirichletCols1", range_type(0, numRows),
1553 KOKKOS_LAMBDA(
const LO row) {
1554 if (dirichletRows(row)) {
1555 auto rowView = localMatrix.row(row);
1556 auto length = rowView.length;
1558 for (
decltype(length) colID = 0; colID < length; colID++)
1559 myColsToZeroView(rowView.colidx(colID), 0) = impl_ATS::one();
1563 Teuchos::RCP<Xpetra::MultiVector<SC, LO, GO, NO>> globalColsToZero = Xpetra::MultiVectorFactory<SC, LO, GO, NO>::Build(domMap, 1);
1564 globalColsToZero->putScalar(zero);
1565 Teuchos::RCP<Xpetra::Export<LO, GO, NO>> exporter = Xpetra::ExportFactory<LO, GO, NO>::Build(colMap, domMap);
// Sum the column-map marks into the domain map ...
1567 globalColsToZero->doExport(*myColsToZero, *exporter, Xpetra::ADD);
// ... and bring the combined values back to the column map.
1569 myColsToZero->doImport(*globalColsToZero, *exporter, Xpetra::INSERT);
1571 auto myCols = myColsToZero->getDeviceLocalView(Xpetra::Access::ReadOnly);
1572 size_t numColEntries = colMap->getLocalNumElements();
1573 Kokkos::View<bool*, typename NO::device_type> dirichletCols(Kokkos::ViewAllocateWithoutInitializing(
"dirichletCols"), numColEntries);
// Note: `eps` already includes the factor of two.
1574 const typename ATS::magnitudeType eps = 2.0 * ATS::eps();
1576 Kokkos::parallel_for(
1577 "MueLu:Utils::DetectDirichletCols2", range_type(0, numColEntries),
1578 KOKKOS_LAMBDA(
const size_t i) {
1579 dirichletCols(i) = impl_ATS::magnitude(myCols(i, 0)) > eps;
1581 return dirichletCols;
// Accumulates, row by row, the sum of products of matching entries of A and B
// into f. Matching is done through global column ids: each local column index
// of A is mapped to its global id and then to B's local column index.
// Preconditions enforced here:
//   - A and B must have the same row map (else Exceptions::Incompatible)
//   - A and B must both be fill-complete (else Exceptions::RuntimeError)
// NOTE(review): the return type, the per-row assignments of nnzA/nnzB, the use
// of `invalid` and `gf`, and the return statement are not visible in this
// excerpt.
1584template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1587 Frobenius(
const Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>& A,
const Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>& B) {
1592 TEUCHOS_TEST_FOR_EXCEPTION(!A.getRowMap()->isSameAs(*B.getRowMap()),
Exceptions::Incompatible,
"MueLu::CGSolver::Frobenius: row maps are incompatible");
1593 TEUCHOS_TEST_FOR_EXCEPTION(!A.isFillComplete() || !B.isFillComplete(),
Exceptions::RuntimeError,
"Matrices must be fill completed");
1595 const Map& AColMap = *A.getColMap();
1596 const Map& BColMap = *B.getColMap();
1598 Teuchos::ArrayView<const LocalOrdinal> indA, indB;
1599 Teuchos::ArrayView<const Scalar> valA, valB;
1600 size_t nnzA = 0, nnzB = 0;
// Scratch array with one slot per local column of B; holds the current row of
// B in scattered form.
1612 Teuchos::Array<Scalar> valBAll(BColMap.getLocalNumElements());
1614 LocalOrdinal invalid = Teuchos::OrdinalTraits<LocalOrdinal>::invalid();
1615 Scalar zero = Teuchos::ScalarTraits<Scalar>::zero(), f = zero, gf;
1616 size_t numRows = A.getLocalNumRows();
1617 for (
size_t i = 0; i < numRows; i++) {
1618 A.getLocalRowView(i, indA, valA);
1619 B.getLocalRowView(i, indB, valB);
// Scatter row i of B into the scratch array.
1624 for (
size_t j = 0; j < nnzB; j++)
1625 valBAll[indB[j]] = valB[j];
1627 for (
size_t j = 0; j < nnzA; j++) {
// Translate A's local column index into B's local column index.
1630 LocalOrdinal ind = BColMap.getLocalElement(AColMap.getGlobalElement(indA[j]));
// NOTE(review): presumably guarded by an ind != invalid check that is not
// visible in this excerpt - confirm.
1632 f += valBAll[ind] * valA[j];
// Reset only the slots touched by this row so the scratch array can be reused.
1636 for (
size_t j = 0; j < nnzB; j++)
1637 valBAll[indB[j]] = zero;
// Seeds Teuchos::ScalarTraits<Scalar>'s random number generator with a value
// computed from comm.getRank() and comm.getSize():
//   mySeed = (INT_MAX - 1) * (one - (rank + 1) / (size + one)), converted to int.
// A seed below 1 or equal to INT_MAX is treated as an error and a message is
// assembled in errStr.
// NOTE(review): the function signature, the definition of `one`, and what is
// done with errStr after it is built are not visible in this excerpt.
1645template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1653 int maxint = INT_MAX;
1654 int mySeed = Teuchos::as<int>((maxint - 1) * (one - (comm.getRank() + 1) / (comm.getSize() + one)));
1655 if (mySeed < 1 || mySeed == maxint) {
1656 std::ostringstream errStr;
1657 errStr <<
"Error detected with random seed = " << mySeed <<
". It should be in the interval [1,2^31-2].";
1662 Teuchos::ScalarTraits<Scalar>::seedrandom(mySeed);
// Collects local row indices of A into dirichletRows.
// dirichletRows is emptied first; a row i is appended when nnz == 1, or when
// count_twos_as_dirichlet is set and nnz == 2.
//   A                       - matrix whose local rows are scanned
//   dirichletRows           - output list of local row indices (overwritten)
//   count_twos_as_dirichlet - also accept rows with nnz == 2
// NOTE(review): the declaration of `nnz` and the body of the magnitude test are
// not visible in this excerpt; presumably nnz counts the entries of the row
// whose magnitude exceeds eps - confirm.
1669template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1671 FindDirichletRows(Teuchos::RCP<Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>>& A,
1672 std::vector<LocalOrdinal>& dirichletRows,
bool count_twos_as_dirichlet) {
1673 typedef typename Teuchos::ScalarTraits<Scalar>::magnitudeType MT;
1674 dirichletRows.resize(0);
1675 for (
size_t i = 0; i < A->getLocalNumRows(); i++) {
1676 Teuchos::ArrayView<const LocalOrdinal> indices;
1677 Teuchos::ArrayView<const Scalar> values;
1678 A->getLocalRowView(i, indices, values);
1680 for (
size_t j = 0; j < (size_t)indices.size(); j++) {
// Entries are tested against the machine epsilon of the magnitude type.
1681 if (Teuchos::ScalarTraits<Scalar>::magnitude(values[j]) > Teuchos::ScalarTraits<MT>::eps()) {
1685 if (nnz == 1 || (count_twos_as_dirichlet && nnz == 2)) {
1686 dirichletRows.push_back(i);
// Rewrites the rows of A listed in dirichletRows (local row indices) in place.
// For each listed row, every entry's global column id is compared with the
// row's global id.
//   A             - matrix modified in place through its local row view
//   dirichletRows - local indices of the rows to rewrite
// NOTE(review): the assignments that follow the comparison are not visible in
// this excerpt; presumably the matching (diagonal) entry is set to `one` and
// all other entries to `zero` - confirm.
1691template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1693 ApplyOAZToMatrixRows(Teuchos::RCP<Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>>& A,
1694 const std::vector<LocalOrdinal>& dirichletRows) {
1695 RCP<const Map> Rmap = A->getRowMap();
1696 RCP<const Map> Cmap = A->getColMap();
1697 Scalar one = Teuchos::ScalarTraits<Scalar>::one();
1698 Scalar zero = Teuchos::ScalarTraits<Scalar>::zero();
1700 for (
size_t i = 0; i < dirichletRows.size(); i++) {
1701 GlobalOrdinal row_gid = Rmap->getGlobalElement(dirichletRows[i]);
1703 Teuchos::ArrayView<const LocalOrdinal> indices;
1704 Teuchos::ArrayView<const Scalar> values;
1705 A->getLocalRowView(dirichletRows[i], indices, values);
// The row view is const; constness is cast away to obtain a writable pointer
// to the row's values.
1707 Scalar* valuesNC =
const_cast<Scalar*
>(values.getRawPtr());
1708 for (
size_t j = 0; j < (size_t)indices.size(); j++) {
// True for the entry whose column has the same global id as the row.
1709 if (Cmap->getGlobalElement(indices[j]) == row_gid)
// Rewrites the rows of A flagged in dirichletRows (one bool per local row).
// For each flagged row a fresh value array is built and written back with
// replaceLocalValues; fillComplete is then called with the domain and range
// maps captured at entry.
// Asserts that A is fill-complete on entry and that dirichletRows has one entry
// per local row-map element.
// NOTE(review): the definition of `row_gid` and the assignments into valuesNC
// are not visible in this excerpt; presumably the diagonal entry receives `one`
// and the others `zero` - confirm. Any call reopening the matrix for
// modification before replaceLocalValues is likewise not visible here.
1717template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1719 ApplyOAZToMatrixRows(Teuchos::RCP<Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>>& A,
1720 const Teuchos::ArrayRCP<const bool>& dirichletRows) {
1721 TEUCHOS_ASSERT(A->isFillComplete());
1722 RCP<const Map> domMap = A->getDomainMap();
1723 RCP<const Map> ranMap = A->getRangeMap();
1724 RCP<const Map> Rmap = A->getRowMap();
1725 RCP<const Map> Cmap = A->getColMap();
1726 TEUCHOS_ASSERT(
static_cast<size_t>(dirichletRows.size()) == Rmap->getLocalNumElements());
1727 const Scalar one = Teuchos::ScalarTraits<Scalar>::one();
1728 const Scalar zero = Teuchos::ScalarTraits<Scalar>::zero();
1730 for (
size_t i = 0; i < (size_t)dirichletRows.size(); i++) {
1731 if (dirichletRows[i]) {
1734 Teuchos::ArrayView<const LocalOrdinal> indices;
1735 Teuchos::ArrayView<const Scalar> values;
1736 A->getLocalRowView(i, indices, values);
// New values are assembled in a separate array of the same length as the row.
1738 Teuchos::ArrayRCP<Scalar> valuesNC(values.size());
1739 for (
size_t j = 0; j < (size_t)indices.size(); j++) {
1740 if (Cmap->getGlobalElement(indices[j]) == row_gid)
// Write the assembled values back using the row's existing column indices.
1745 A->replaceLocalValues(i, indices, valuesNC());
1748 A->fillComplete(domMap, ranMap);
// Kokkos variant: rewrites the rows of A flagged in dirichletRows directly in
// the device-side local matrix.
// For each flagged row, the row's global id is mapped to a local column index
// (row_lid); the entry whose column index equals row_lid is set to one() and
// the remaining assignment writes zero().
// Asserts that A is fill-complete and that dirichletRows has one entry per
// local row-map element.
// NOTE(review): the lambda header and the `else` separating the two
// assignments are not visible in this excerpt.
1751template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1753 ApplyOAZToMatrixRows(Teuchos::RCP<Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>>& A,
1754 const Kokkos::View<const bool*, typename Node::device_type>& dirichletRows) {
1755 TEUCHOS_ASSERT(A->isFillComplete());
1756 using ATS = Kokkos::ArithTraits<Scalar>;
1757 using impl_ATS = Kokkos::ArithTraits<typename ATS::val_type>;
1758 using range_type = Kokkos::RangePolicy<LocalOrdinal, typename Node::execution_space>;
1760 RCP<const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>> domMap = A->getDomainMap();
1761 RCP<const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>> ranMap = A->getRangeMap();
1762 RCP<const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>> Rmap = A->getRowMap();
1763 RCP<const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>> Cmap = A->getColMap();
1765 TEUCHOS_ASSERT(
static_cast<size_t>(dirichletRows.size()) == Rmap->getLocalNumElements());
// Local objects captured by the kernel below.
1767 auto localMatrix = A->getLocalMatrixDevice();
1768 auto localRmap = Rmap->getLocalMap();
1769 auto localCmap = Cmap->getLocalMap();
1771 Kokkos::parallel_for(
1772 "MueLu::Utils::ApplyOAZ", range_type(0, dirichletRows.extent(0)),
1774 if (dirichletRows(row)) {
1775 auto rowView = localMatrix.row(row);
1776 auto length = rowView.length;
// Locate the diagonal: row local id -> global id -> local column id.
1777 auto row_gid = localRmap.getGlobalElement(row);
1778 auto row_lid = localCmap.getLocalElement(row_gid);
1780 for (
decltype(length) colID = 0; colID < length; colID++)
1781 if (rowView.colidx(colID) == row_lid)
1782 rowView.value(colID) = impl_ATS::one();
1784 rowView.value(colID) = impl_ATS::zero();
// Overwrites every stored entry of the rows of A listed in dirichletRows
// (local row indices) with replaceWith, writing through the local row view.
//   A             - matrix modified in place
//   dirichletRows - local indices of the rows to overwrite
// NOTE(review): the declaration of the `replaceWith` parameter is not visible
// in this excerpt.
1789template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1791 ZeroDirichletRows(Teuchos::RCP<Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>>& A,
1792 const std::vector<LocalOrdinal>& dirichletRows,
1794 for (
size_t i = 0; i < dirichletRows.size(); i++) {
1795 Teuchos::ArrayView<const LocalOrdinal> indices;
1796 Teuchos::ArrayView<const Scalar> values;
1797 A->getLocalRowView(dirichletRows[i], indices, values);
// The row view is const; constness is cast away to obtain a writable pointer
// to the row's values.
1799 Scalar* valuesNC =
const_cast<Scalar*
>(values.getRawPtr());
1800 for (
size_t j = 0; j < (size_t)indices.size(); j++)
1801 valuesNC[j] = replaceWith;
// Overwrites every stored entry of the rows of A flagged in dirichletRows
// (one bool per local row) with replaceWith, writing through the local row view.
// Asserts that dirichletRows has one entry per local row-map element.
//   A             - matrix modified in place
//   dirichletRows - per-row flags; true selects the row
// NOTE(review): the declaration of the `replaceWith` parameter is not visible
// in this excerpt.
1805template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1807 ZeroDirichletRows(Teuchos::RCP<Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>>& A,
1808 const Teuchos::ArrayRCP<const bool>& dirichletRows,
1810 TEUCHOS_ASSERT(
static_cast<size_t>(dirichletRows.size()) == A->getRowMap()->getLocalNumElements());
1811 for (
size_t i = 0; i < (size_t)dirichletRows.size(); i++) {
1812 if (dirichletRows[i]) {
1813 Teuchos::ArrayView<const LocalOrdinal> indices;
1814 Teuchos::ArrayView<const Scalar> values;
1815 A->getLocalRowView(i, indices, values);
// The row view is const; constness is cast away to obtain a writable pointer
// to the row's values.
1817 Scalar* valuesNC =
const_cast<Scalar*
>(values.getRawPtr());
1818 for (
size_t j = 0; j < (size_t)indices.size(); j++)
1819 valuesNC[j] = replaceWith;
// Overwrites, in every vector (column) of the multivector X, the entries of
// the local rows flagged in dirichletRows with replaceWith.
// Asserts that dirichletRows has one entry per local element of X's map.
//   X             - multivector modified in place
//   dirichletRows - per-row flags; true selects the row
// NOTE(review): the declaration of the `replaceWith` parameter is not visible
// in this excerpt.
1824template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1826 ZeroDirichletRows(Teuchos::RCP<Xpetra::MultiVector<Scalar, LocalOrdinal, GlobalOrdinal, Node>>& X,
1827 const Teuchos::ArrayRCP<const bool>& dirichletRows,
1829 TEUCHOS_ASSERT(
static_cast<size_t>(dirichletRows.size()) == X->getMap()->getLocalNumElements());
1830 for (
size_t i = 0; i < (size_t)dirichletRows.size(); i++) {
1831 if (dirichletRows[i]) {
1832 for (
size_t j = 0; j < X->getNumVectors(); j++)
1833 X->replaceLocalValue(i, j, replaceWith);
// Kokkos variant: overwrites every stored entry of the rows of A flagged in
// dirichletRows with replaceWith, operating on the device-side local matrix
// inside a parallel_for over rows.
//   A             - matrix modified in place
//   dirichletRows - per-row flags; true selects the row
// NOTE(review): the declaration of the `replaceWith` parameter, the definition
// of `numRows`, and the lambda header are not visible in this excerpt.
1838template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1840 ZeroDirichletRows(RCP<Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>>& A,
1841 const Kokkos::View<const bool*, typename Node::device_type>& dirichletRows,
1843 using ATS = Kokkos::ArithTraits<Scalar>;
1844 using range_type = Kokkos::RangePolicy<LocalOrdinal, typename Node::execution_space>;
// Convert the replacement value to the Kokkos-side value type used in kernels.
1846 typename ATS::val_type impl_replaceWith = replaceWith;
1848 auto localMatrix = A->getLocalMatrixDevice();
1851 Kokkos::parallel_for(
1852 "MueLu:Utils::ZeroDirichletRows", range_type(0, numRows),
1854 if (dirichletRows(row)) {
1855 auto rowView = localMatrix.row(row);
1856 auto length = rowView.length;
1857 for (
decltype(length) colID = 0; colID < length; colID++)
1858 rowView.value(colID) = impl_replaceWith;
// Kokkos variant for multivectors: overwrites, in every vector (column) of X,
// the entries of the local rows flagged in dirichletRows with replaceWith.
// The kernel runs over dirichletRows.size() rows on X's device local view.
//   X             - multivector modified in place
//   dirichletRows - per-row flags; true selects the row
// NOTE(review): the declaration of the `replaceWith` parameter is not visible
// in this excerpt.
1863template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1865 ZeroDirichletRows(RCP<Xpetra::MultiVector<Scalar, LocalOrdinal, GlobalOrdinal, Node>>& X,
1866 const Kokkos::View<const bool*, typename Node::device_type>& dirichletRows,
1868 using ATS = Kokkos::ArithTraits<Scalar>;
1869 using range_type = Kokkos::RangePolicy<LocalOrdinal, typename Node::execution_space>;
// Convert the replacement value to the Kokkos-side value type used in kernels.
1871 typename ATS::val_type impl_replaceWith = replaceWith;
1873 auto myCols = X->getDeviceLocalView(Xpetra::Access::ReadWrite);
1874 size_t numVecs = X->getNumVectors();
1875 Kokkos::parallel_for(
1876 "MueLu:Utils::ZeroDirichletRows_MV", range_type(0, dirichletRows.size()),
1877 KOKKOS_LAMBDA(
const size_t i) {
1878 if (dirichletRows(i)) {
1879 for (
size_t j = 0; j < numVecs; j++)
1880 myCols(i, j) = impl_replaceWith;
// Overwrites with replaceWith every stored entry of A whose local column index
// is flagged in dirichletCols, scanning all local rows and writing through the
// local row view.
// Asserts that dirichletCols has one entry per local column-map element.
// NOTE(review): the function name line, the matrix parameter A and the
// `replaceWith` parameter are not visible in this excerpt.
1885template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1888 const Teuchos::ArrayRCP<const bool>& dirichletCols,
1890 TEUCHOS_ASSERT(
static_cast<size_t>(dirichletCols.size()) == A->getColMap()->getLocalNumElements());
1891 for (
size_t i = 0; i < A->getLocalNumRows(); i++) {
1892 Teuchos::ArrayView<const LocalOrdinal> indices;
1893 Teuchos::ArrayView<const Scalar> values;
1894 A->getLocalRowView(i, indices, values);
// The row view is const; constness is cast away to obtain a writable pointer
// to the row's values.
1896 Scalar* valuesNC =
const_cast<Scalar*
>(values.getRawPtr());
1897 for (
size_t j = 0; j < static_cast<size_t>(indices.size()); j++)
1898 if (dirichletCols[indices[j]])
1899 valuesNC[j] = replaceWith;
// Kokkos variant: overwrites with replaceWith every stored entry of A whose
// local column index is flagged in dirichletCols, operating on the device-side
// local matrix inside a parallel_for over rows.
//   A             - matrix modified in place
//   dirichletCols - per-column flags indexed by local column index
// NOTE(review): the declaration of the `replaceWith` parameter, the definition
// of `numRows`, and the lambda header are not visible in this excerpt.
1903template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1905 ZeroDirichletCols(RCP<Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>>& A,
1906 const Kokkos::View<const bool*, typename Node::device_type>& dirichletCols,
1908 using ATS = Kokkos::ArithTraits<Scalar>;
1909 using range_type = Kokkos::RangePolicy<LocalOrdinal, typename Node::execution_space>;
// Convert the replacement value to the Kokkos-side value type used in kernels.
1911 typename ATS::val_type impl_replaceWith = replaceWith;
1913 auto localMatrix = A->getLocalMatrixDevice();
1916 Kokkos::parallel_for(
1917 "MueLu:Utils::ZeroDirichletCols", range_type(0, numRows),
1919 auto rowView = localMatrix.row(row);
1920 auto length = rowView.length;
1921 for (
decltype(length) colID = 0; colID < length; colID++)
1922 if (dirichletCols(rowView.colidx(colID))) {
1923 rowView.value(colID) = impl_replaceWith;
// Produces two int indicator vectors: isDirichletRow on A's row map and
// isDirichletCol on A's column map.
// Entries of isDirichletRow are set to 1 for each index in the local list
// dirichletRows. When A's graph has no importer, the same local indices are
// also set to 1 in isDirichletCol; the doImport at the end combines
// isDirichletRow into isDirichletCol with CombineMode::ADD.
// Throws std::runtime_error when A's row map and domain map differ.
// NOTE(review): the function name line, the matrix parameter A, the code that
// fills `dirichletRows`, and the condition guarding the final doImport are not
// visible in this excerpt.
1928template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1931 Teuchos::RCP<Xpetra::Vector<int, LocalOrdinal, GlobalOrdinal, Node>>& isDirichletRow,
1932 Teuchos::RCP<Xpetra::Vector<int, LocalOrdinal, GlobalOrdinal, Node>>& isDirichletCol) {
1934 if (!A->getRowMap()->isSameAs(*A->getDomainMap())) {
1935 throw std::runtime_error(
"UtilitiesBase::FindDirichletRowsAndPropagateToCols row and domain maps must match.");
1937 RCP<const Xpetra::Import<LocalOrdinal, GlobalOrdinal, Node>> importer = A->getCrsGraph()->getImporter();
1938 bool has_import = !importer.is_null();
1941 std::vector<LocalOrdinal> dirichletRows;
// Debug output of the detected row ids.
// NOTE(review): any preprocessor guard around this block is not visible in
// this excerpt.
1945 printf(
"[%d] DirichletRow Ids = ",A->getRowMap()->getComm()->getRank());
1946 for(
size_t i=0; i<(size_t) dirichletRows.size(); i++)
1947 printf(
"%d ",dirichletRows[i]);
// NOTE(review): the trailing `true` argument presumably requests
// zero-initialised vectors - confirm against the VectorFactory documentation.
1952 isDirichletRow = Xpetra::VectorFactory<int, LocalOrdinal, GlobalOrdinal, Node>::Build(A->getRowMap(),
true);
1953 isDirichletCol = Xpetra::VectorFactory<int, LocalOrdinal, GlobalOrdinal, Node>::Build(A->getColMap(),
true);
1956 Teuchos::ArrayRCP<int> dr_rcp = isDirichletRow->getDataNonConst(0);
1957 Teuchos::ArrayView<int> dr = dr_rcp();
1958 Teuchos::ArrayRCP<int> dc_rcp = isDirichletCol->getDataNonConst(0);
1959 Teuchos::ArrayView<int> dc = dc_rcp();
1960 for (
size_t i = 0; i < (size_t)dirichletRows.size(); i++) {
1961 dr[dirichletRows[i]] = 1;
// Without an importer the column flags are written directly with the same
// local index.
1962 if (!has_import) dc[dirichletRows[i]] = 1;
1967 isDirichletCol->doImport(*isDirichletRow, *importer, Xpetra::CombineMode::ADD);
// Builds a new matrix on the CrsGraph of `original` whose values are ONE where
// the original value differs from ZERO, and ZERO in the remaining assignment.
// The new matrix is fill-completed with the original's domain and range maps.
// Throws Exceptions::RuntimeError when `original` has no CrsGraph or when
// MatrixFactory::Build returns null.
// NOTE(review): the function name line (the name is taken from the error
// strings below), the `original` parameter, the `else` between the two
// assignments, and the return statement are not visible in this excerpt.
1970template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
1971RCP<Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>>
1974 using ISC =
typename Kokkos::ArithTraits<Scalar>::val_type;
1975 using range_type = Kokkos::RangePolicy<LocalOrdinal, typename Node::execution_space>;
1976 using local_matrix_type =
typename CrsMatrix::local_matrix_type;
1977 using values_type =
typename local_matrix_type::values_type;
1979 const ISC ONE = Kokkos::ArithTraits<ISC>::one();
1980 const ISC ZERO = Kokkos::ArithTraits<ISC>::zero();
// Note: the local matrix is fetched before the CrsGraph check below.
1983 auto localMatrix = original->getLocalMatrixDevice();
1984 TEUCHOS_TEST_FOR_EXCEPTION(!original->hasCrsGraph(),
Exceptions::RuntimeError,
"ReplaceNonZerosWithOnes: Cannot get CrsGraph");
// One new value per stored entry of the original matrix.
1985 values_type new_values(
"values", localMatrix.nnz());
1987 Kokkos::parallel_for(
1988 "ReplaceNonZerosWithOnes", range_type(0, localMatrix.nnz()), KOKKOS_LAMBDA(
const size_t i) {
1989 if (localMatrix.values(i) != ZERO)
1990 new_values(i) = ONE;
1992 new_values(i) = ZERO;
1996 RCP<Matrix> NewMatrix = Xpetra::MatrixFactory<SC, LO, GO, NO>::Build(original->getCrsGraph(), new_values);
1997 TEUCHOS_TEST_FOR_EXCEPTION(NewMatrix.is_null(),
Exceptions::RuntimeError,
"ReplaceNonZerosWithOnes: MatrixFactory::Build() did not return matrix");
1998 NewMatrix->fillComplete(original->getDomainMap(), original->getRangeMap());
// Builds a BlockedMap over Importer's target map that mirrors the sub-map
// structure of sourceBlockedMap.
// Steps visible here:
//   1. Take the full map of sourceBlockedMap (unwrapping a StridedMap if the
//      dynamic cast succeeds).
//   2. Store, for every local element of each sub-map i, the value i in an int
//      vector on the full map.
//   3. Import that vector onto the target map with CombineMode::ADD.
//   4. Group the target map's global ids by the imported block id and build
//      one Map per sub-map from each group.
// Throws std::runtime_error when Importer's source map is not compatible with
// the full map.
// NOTE(review): the function name line and the sourceBlockedMap parameter are
// not visible in this excerpt.
2002template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
2003RCP<const Xpetra::BlockedMap<LocalOrdinal, GlobalOrdinal, Node>>
2006 const Xpetra::Import<LocalOrdinal, GlobalOrdinal, Node>& Importer) {
2007 typedef Xpetra::Vector<int, LocalOrdinal, GlobalOrdinal, Node> IntVector;
2008 Xpetra::UnderlyingLib lib = sourceBlockedMap.lib();
2011 RCP<const Map> fullMap = sourceBlockedMap.getMap();
2012 RCP<const Map> stridedMap = Teuchos::rcp_dynamic_cast<const Xpetra::StridedMap<LocalOrdinal, GlobalOrdinal, Node>>(fullMap);
2013 if (!stridedMap.is_null()) fullMap = stridedMap->getMap();
2016 const size_t numSubMaps = sourceBlockedMap.getNumMaps();
2017 if (!Importer.getSourceMap()->isCompatible(*fullMap))
2018 throw std::runtime_error(
"GenerateBlockedTargetMap(): Map compatibility error");
2021 RCP<IntVector> block_ids = Xpetra::VectorFactory<int, LocalOrdinal, GlobalOrdinal, Node>::Build(fullMap);
// Record the sub-map index of every locally owned element.
2023 for (
size_t i = 0; i < numSubMaps; i++) {
2024 RCP<const Map> map = sourceBlockedMap.getMap(i);
2026 for (
size_t j = 0; j < map->getLocalNumElements(); j++) {
2027 LocalOrdinal jj = fullMap->getLocalElement(map->getGlobalElement(j));
2028 block_ids->replaceLocalValue(jj, (
int)i);
2033 RCP<const Map> targetMap = Importer.getTargetMap();
2034 RCP<IntVector> new_block_ids = Xpetra::VectorFactory<int, LocalOrdinal, GlobalOrdinal, Node>::Build(targetMap);
2035 new_block_ids->doImport(*block_ids, Importer, Xpetra::CombineMode::ADD);
2036 Teuchos::ArrayRCP<const int> dataRCP = new_block_ids->getData(0);
2037 Teuchos::ArrayView<const int> data = dataRCP();
// Bucket the target map's global ids by imported block id; data[i] is used
// directly as the bucket index.
2040 Teuchos::Array<Teuchos::Array<GlobalOrdinal>> elementsInSubMap(numSubMaps);
2041 for (
size_t i = 0; i < targetMap->getLocalNumElements(); i++) {
2042 elementsInSubMap[data[i]].push_back(targetMap->getGlobalElement(i));
2046 std::vector<RCP<const Map>> subMaps(numSubMaps);
2047 for (
size_t i = 0; i < numSubMaps; i++) {
2048 subMaps[i] = Xpetra::MapFactory<LocalOrdinal, GlobalOrdinal, Node>::Build(lib, Teuchos::OrdinalTraits<GlobalOrdinal>::invalid(), elementsInSubMap[i](), targetMap->getIndexBase(), targetMap->getComm());
2052 return rcp(
new BlockedMap(targetMap, subMaps));
// Compares the local element lists of rowMap and colMap position by position
// over the first rowElements.size() entries.
//   rowMap - map whose local element list is the reference prefix
//   colMap - map whose local element list is checked against it
// NOTE(review): the return type, the statement taken when colMap has fewer
// local elements than rowMap, the body of the mismatch branch, and the return
// statement are not visible in this excerpt; presumably the function reports
// whether rowMap's list is a leading prefix of colMap's list - confirm.
2055template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
2057 MapsAreNested(
const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>& rowMap,
const Xpetra::Map<LocalOrdinal, GlobalOrdinal, Node>& colMap) {
2058 ArrayView<const GlobalOrdinal> rowElements = rowMap.getLocalElementList();
2059 ArrayView<const GlobalOrdinal> colElements = colMap.getLocalElementList();
2061 const size_t numElements = rowElements.size();
// A column list shorter than the row list is handled before the comparison.
2063 if (
size_t(colElements.size()) < numElements)
2066 bool goodMap =
true;
2067 for (
size_t i = 0; i < numElements; i++)
2068 if (rowElements[i] != colElements[i]) {
2076template <
class Scalar,
class LocalOrdinal,
class GlobalOrdinal,
class Node>
2077Teuchos::RCP<Xpetra::Vector<LocalOrdinal, LocalOrdinal, GlobalOrdinal, Node>>
2079 ReverseCuthillMcKee(
const Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>& Op) {
2080 using local_matrix_type =
typename Xpetra::Matrix<Scalar, LocalOrdinal, GlobalOrdinal, Node>::local_matrix_type;
2081 using local_graph_type =
typename local_matrix_type::staticcrsgraph_type;
2082 using lno_nnz_view_t =
typename local_graph_type::entries_type::non_const_type;
2083 using device =
typename local_graph_type::device_type;
2084 using execution_space =
typename local_matrix_type::execution_space;
2085 using ordinal_type =
typename local_matrix_type::ordinal_type;
2087 local_graph_type localGraph = Op.getLocalMatrixDevice().graph;
2089 lno_nnz_view_t rcmOrder = KokkosGraph::Experimental::graph_rcm<device, typename local_graph_type::row_map_type, typename local_graph_type::entries_type, lno_nnz_view_t>(localGraph.row_map, localGraph.entries);
2091 RCP<Xpetra::Vector<LocalOrdinal, LocalOrdinal, GlobalOrdinal, Node>> retval =
2092 Xpetra::VectorFactory<LocalOrdinal, LocalOrdinal, GlobalOrdinal, Node>::Build(Op.getRowMap());
2095 auto view1D = Kokkos::subview(retval->getDeviceLocalView(Xpetra::Access::ReadWrite), Kokkos::ALL(), 0);
2096 Kokkos::parallel_for(
2097 "Utilities::ReverseCuthillMcKee",
2098 Kokkos::RangePolicy<ordinal_type, execution_space>(0, localGraph.numRows()),
2099 KOKKOS_LAMBDA(
const ordinal_type rowIdx) {
2100 view1D(rcmOrder(rowIdx)) = rowIdx;