46 #ifndef MUELU_UTILITIES_KOKKOS_DECL_HPP
47 #define MUELU_UTILITIES_KOKKOS_DECL_HPP
50 #if defined(HAVE_MUELU_KOKKOS_REFACTOR)
74 #ifdef HAVE_MUELU_EPETRA
75 #include <Epetra_MultiVector.h>
76 #include <Epetra_CrsMatrix.h>
82 #include "MueLu_Utilities.hpp"
83 #include "MueLu_UtilitiesBase.hpp"
85 #ifdef HAVE_MUELU_TPETRA
86 #include <Tpetra_CrsMatrix.hpp>
87 #include <Tpetra_Map.hpp>
88 #include <Tpetra_MultiVector.hpp>
103 template <
class Scalar,
104 class LocalOrdinal = int,
105 class GlobalOrdinal = LocalOrdinal,
108 #undef MUELU_UTILITIES_KOKKOS_SHORT
115 #ifdef HAVE_MUELU_EPETRA
// Thin forwarder: passes `vec` straight to Utilities::MV2EpetraMV and returns
// that call's result, a handle to a const Epetra_MultiVector.
118 static RCP<const Epetra_MultiVector> MV2EpetraMV(RCP<MultiVector>
const vec) {
return Utilities::MV2EpetraMV(vec); }
134 #ifdef HAVE_MUELU_TPETRA
// Thin forwarder: passes `vec` straight to Utilities::MV2TpetraMV and returns
// that call's result, a handle to a const Tpetra::MultiVector<SC,LO,GO,NO>.
137 static RCP<const Tpetra::MultiVector<SC,LO,GO,NO> > MV2TpetraMV(RCP<MultiVector>
const vec) {
return Utilities::MV2TpetraMV(vec); }
// Thin forwarder: passes `Op` to Utilities::Op2TpetraCrs and returns that
// call's result, a handle to a const Tpetra::CrsMatrix<SC,LO,GO,NO>.
144 static RCP<const Tpetra::CrsMatrix<SC,LO,GO,NO> > Op2TpetraCrs(RCP<const Matrix> Op) {
return Utilities::Op2TpetraCrs(Op); }
// Thin forwarder: passes `Op` to Utilities::Op2TpetraRow and returns that
// call's result, a handle to a const Tpetra::RowMatrix<SC,LO,GO,NO>.
150 static RCP<const Tpetra::RowMatrix<SC,LO,GO,NO> > Op2TpetraRow(RCP<const Matrix> Op) {
return Utilities::Op2TpetraRow(Op); }
// Thin forwarder: passes the CrsMatrix handle `Op` to Utilities::Crs2Op and
// returns that call's result as an RCP to Xpetra::Matrix<SC,LO,GO,NO>.
156 static RCP<Xpetra::Matrix<SC,LO,GO,NO> > Crs2Op(RCP<CrsMatrix> Op) {
return Utilities::Crs2Op(Op); }
// Declaration only; the definition is not part of this listing.
// Takes the matrix by const reference and returns an RCP<Vector>.
// NOTE(review): judging by the name, the result is the matrix diagonal in an
// overlapped (column-map) layout -- confirm against the definition.
193 static RCP<Vector> GetMatrixOverlappedDiagonal(
const Matrix& A);
// Declaration only; takes no arguments and returns nothing. The definition is
// not part of this listing.
216 static void PauseForDebugger();
233 static SC PowerMethod(
const Matrix& A,
bool scaleByDiag =
true,
234 LO niters = 10, Magnitude tolerance = 1e-2,
bool verbose =
false,
unsigned int seed = 123) {
239 bool doFillComplete =
true,
bool doOptimizeStorage =
true);
242 bool doFillComplete,
bool doOptimizeStorage);
245 bool doFillComplete,
bool doOptimizeStorage);
// Thin forwarder: passes the stream `os` to Utilities::MakeFancy and returns
// the resulting RCP<Teuchos::FancyOStream>.
247 static RCP<Teuchos::FancyOStream> MakeFancy(std::ostream& os) {
return Utilities::MakeFancy(os); }
// Declaration only; the definition is not part of this listing.
// Inputs: the matrix `A` and a Kokkos::View of const bool on NO::device_type
// named `dirichletRows`. Returns a Kokkos::View of const bool on the same
// device type.
// NOTE(review): presumably one flag per row on input and one per column on
// output -- confirm against the definition.
268 static Kokkos::View<const bool*, typename NO::device_type>
DetectDirichletCols(
const Matrix& A,
const Kokkos::View<const bool*, typename NO::device_type>& dirichletRows);
// Declaration only; takes an RCP<RealValuedMultiVector> and returns an
// RCP<MultiVector>. The definition is not part of this listing.
277 static RCP<MultiVector> RealValuedToScalarMultiVector(RCP<RealValuedMultiVector> X);
295 static RCP<Matrix> Transpose(Matrix& Op,
bool optimizeTranspose =
false,
const std::string & label = std::string()) {
299 static RCP<Xpetra::MultiVector<double,LocalOrdinal,GlobalOrdinal,Node> > ExtractCoordinatesFromParameterList(ParameterList& paramList) {
315 template <
class Node>
316 class Utilities_kokkos<double,int,int,Node> :
public UtilitiesBase<double,int,int,Node> {
318 typedef double Scalar;
319 typedef int LocalOrdinal;
320 typedef int GlobalOrdinal;
325 #undef MUELU_UTILITIES_KOKKOS_SHORT
330 #ifdef HAVE_MUELU_EPETRA
// Thin forwarder (double/int/int specialization): passes `vec` to
// Utilities::MV2EpetraMV and returns that call's result, a handle to a const
// Epetra_MultiVector.
333 static RCP<const Epetra_MultiVector> MV2EpetraMV(RCP<MultiVector>
const vec) {
return Utilities::MV2EpetraMV(vec); }
349 #ifdef HAVE_MUELU_TPETRA
// Thin forwarder (double/int/int specialization): passes `vec` to
// Utilities::MV2TpetraMV and returns that call's result, a handle to a const
// Tpetra::MultiVector<SC,LO,GO,NO>.
352 static RCP<const Tpetra::MultiVector<SC,LO,GO,NO> > MV2TpetraMV(RCP<MultiVector>
const vec) {
return Utilities::MV2TpetraMV(vec); }
// Thin forwarder (double/int/int specialization): passes `Op` to
// Utilities::Op2TpetraCrs and returns that call's result, a handle to a const
// Tpetra::CrsMatrix<SC,LO,GO,NO>.
359 static RCP<const Tpetra::CrsMatrix<SC,LO,GO,NO> > Op2TpetraCrs(RCP<const Matrix> Op) {
return Utilities::Op2TpetraCrs(Op); }
// Thin forwarder (double/int/int specialization): passes `Op` to
// Utilities::Op2TpetraRow and returns that call's result, a handle to a const
// Tpetra::RowMatrix<SC,LO,GO,NO>.
365 static RCP<const Tpetra::RowMatrix<SC,LO,GO,NO> > Op2TpetraRow(RCP<const Matrix> Op) {
return Utilities::Op2TpetraRow(Op); }
// Thin forwarder (double/int/int specialization): passes the CrsMatrix handle
// `Op` to Utilities::Crs2Op and returns that call's result as an RCP to
// Xpetra::Matrix<SC,LO,GO,NO>.
370 static RCP<Xpetra::Matrix<SC,LO,GO,NO> > Crs2Op(RCP<CrsMatrix> Op) {
return Utilities::Crs2Op(Op); }
372 static ArrayRCP<SC> GetMatrixDiagonal(
const Matrix& A) {
378 static ArrayRCP<SC> GetLumpedMatrixDiagonal(
const Matrix& A) {
381 static RCP<Vector> GetLumpedMatrixDiagonal(RCP<const Matrix > A) {
384 static RCP<Vector> GetMatrixOverlappedDiagonal(
const Matrix& A) {
396 static void PauseForDebugger() {
399 static RCP<Teuchos::FancyOStream> MakeFancy(std::ostream& os) {
// Declaration only (double/int/int specialization); the definition is not part
// of this listing.
// Inputs: the matrix `A` and a Kokkos::View of const bool on Node::device_type
// named `dirichletRows`. Returns a Kokkos::View of const bool on the same
// device type.
// NOTE(review): presumably one flag per row on input and one per column on
// output -- confirm against the definition.
409 static Kokkos::View<const bool*, typename Node::device_type>
DetectDirichletCols(
const Matrix& A,
const Kokkos::View<const bool*, typename Node::device_type>& dirichletRows);
// Declaration only (double/int/int specialization); takes an
// RCP<RealValuedMultiVector> and returns an RCP<MultiVector>. The definition
// is not part of this listing.
417 static RCP<MultiVector> RealValuedToScalarMultiVector(RCP<RealValuedMultiVector> X);
419 static Scalar PowerMethod(
const Matrix& A,
bool scaleByDiag =
true,
LO niters = 10, Magnitude tolerance = 1e-2,
bool verbose =
false,
unsigned int seed = 123) {
// NOTE(review): the line carrying this function's name and leading parameters
// is missing from the listing; from the calls below it is presumably the
// library-independent scaling entry point (MyOldScaleMatrix) -- confirm.
// Both trailing flags default to true.
424 bool doFillComplete =
true,
bool doOptimizeStorage =
true) {
// Two fill loops for the working vector `sv` are visible. This one stores the
// reciprocal of each scaling entry; the condition that selects between the two
// loops is not part of this listing.
428 for (
int i = 0; i < scalingVector.
size(); ++i)
429 sv[i] = one / scalingVector[i];
// Alternative fill: copy the scaling entries unchanged.
431 for (
int i = 0; i < scalingVector.
size(); ++i)
432 sv[i] = scalingVector[i];
// Dispatch on the linear-algebra library reported by Op's row map.
435 switch (Op.getRowMap()->lib()) {
437 MyOldScaleMatrix_Tpetra(Op, sv, doFillComplete, doOptimizeStorage);
441 MyOldScaleMatrix_Epetra(Op, sv, doFillComplete, doOptimizeStorage);
// Any other library value is rejected.
445 throw Exceptions::RuntimeError(
"Only Epetra and Tpetra matrices can be scaled.");
446 #ifndef __NVCC__ //prevent nvcc warning
// NOTE(review): the line carrying this function's name and leading parameters
// is missing from the listing; given the Tpetra guards and the matching call
// signature it is presumably MyOldScaleMatrix_Tpetra -- confirm.
454 bool doFillComplete,
bool doOptimizeStorage) {
// The implementation is only compiled when Tpetra is enabled and instantiated
// for LO=GO=int; the fallback branches at the bottom throw instead.
455 #ifdef HAVE_MUELU_TPETRA
456 #ifdef HAVE_MUELU_TPETRA_INST_INT_INT
// Maps are captured up front; the domain and range maps are checked before
// fillComplete further down.
460 const RCP<const Tpetra::Map<LO,GO,NO> > rowMap = tpOp.
getRowMap();
461 const RCP<const Tpetra::Map<LO,GO,NO> > domainMap = tpOp.
getDomainMap();
462 const RCP<const Tpetra::Map<LO,GO,NO> > rangeMap = tpOp.
getRangeMap();
// size_t(-1) is treated as a special value of maxRowSize; the statement it
// guards is not part of this listing.
465 if (maxRowSize == Teuchos::as<size_t>(-1))
// Scratch buffer for one row of scaled values, resized below when a row has
// more entries than the current maxRowSize.
468 std::vector<SC> scaledVals(maxRowSize);
// Locally indexed case: rows are walked by local index i.
472 if (Op.isLocallyIndexed() ==
true) {
476 for (
size_t i = 0; i < rowMap->getNodeNumElements(); ++i) {
479 if (nnz > maxRowSize) {
481 scaledVals.resize(maxRowSize);
// Every entry of row i is multiplied by the i-th scaling factor.
483 for (
size_t j = 0; j < nnz; ++j)
484 scaledVals[j] = vals[j]*scalingVector[i];
// Other case: same row loop, but the global id of row i is looked up first.
496 for (
size_t i = 0; i < rowMap->getNodeNumElements(); ++i) {
497 GO gid = rowMap->getGlobalElement(i);
500 if (nnz > maxRowSize) {
502 scaledVals.resize(maxRowSize);
505 for (
size_t j = 0; j < nnz; ++j)
506 scaledVals[j] = vals[j]*scalingVector[i];
// Optional fillComplete: needs both the domain and range map, and passes the
// "Optimize Storage" and "No Nonlocal Changes" parameters.
515 if (doFillComplete) {
516 if (domainMap == Teuchos::null || rangeMap == Teuchos::null)
517 throw Exceptions::RuntimeError(
"In Utilities::Scaling: cannot fillComplete because the domain and/or range map hasn't been defined");
520 params->
set(
"Optimize Storage", doOptimizeStorage);
521 params->
set(
"No Nonlocal Changes",
true);
522 Op.fillComplete(Op.getDomainMap(), Op.getRangeMap(), params);
// Error exits: operator is not a Tpetra::CrsMatrix, Tpetra lacks the
// LO=GO=int instantiation, or Tpetra is disabled.
525 throw Exceptions::RuntimeError(
"Only Tpetra::CrsMatrix types can be scaled (Err.1)");
528 throw Exceptions::RuntimeError(
"Matrix scaling is not possible because Tpetra has not been compiled with support for LO=GO=int.");
531 throw Exceptions::RuntimeError(
"Matrix scaling is not possible because Tpetra has not been enabled.");
// Epetra scaling helper. The visible lines multiply each stored value of a row
// in place by that row's scaling factor.
// Parameters: Op (matrix to scale), scalingVector (indexed by i in the update
// below), doFillComplete and doOptimizeStorage (not referenced in the lines
// visible here).
// Throws Exceptions::RuntimeError with the messages shown below; one of them
// reports that Epetra has not been enabled.
535 static void MyOldScaleMatrix_Epetra(Matrix& Op,
const Teuchos::ArrayRCP<Scalar>& scalingVector,
bool doFillComplete,
bool doOptimizeStorage) {
536 #ifdef HAVE_MUELU_EPETRA
// In-place scaling of the nnz values of the current row i (the enclosing row
// loop is not part of this listing).
548 for (
int j = 0; j < nnz; ++j)
549 vals[j] *= scalingVector[i];
553 throw Exceptions::RuntimeError(
"Only Epetra_CrsMatrix types can be scaled");
556 throw Exceptions::RuntimeError(
"Matrix scaling is not possible because Epetra has not been enabled.");
557 #endif // HAVE_MUELU_EPETRA
// Builds the transpose of Op, choosing the backend from the linear-algebra
// library reported by Op's row map.
// Parameters:
//   Op                - matrix to transpose.
//   optimizeTranspose - defaults to false; not referenced in the lines visible here.
//   label             - defaults to an empty string; not referenced in the lines visible here.
//   params            - optional parameter list (defaults to Teuchos::null) that is
//                       handed to the Tpetra transposer's createTranspose().
// Returns the transposed matrix as an RCP<Matrix>; the trailing
// `return Teuchos::null` only exists to silence compiler warnings.
// Throws Exceptions::RuntimeError when the required backend is not compiled
// in, when the Tpetra transpose throws, or when the library is neither Epetra
// nor Tpetra.
565 static RCP<Matrix> Transpose(Matrix& Op,
bool optimizeTranspose =
false,
const std::string & label = std::string(),
const Teuchos::RCP<Teuchos::ParameterList> &params=Teuchos::null) {
566 switch (Op.getRowMap()->lib()) {
// Tpetra path: only available when Tpetra is enabled and instantiated for
// LO=GO=int.
569 #ifdef HAVE_MUELU_TPETRA
570 #ifdef HAVE_MUELU_TPETRA_INST_INT_INT
575 RCP<Tpetra::CrsMatrix<Scalar, LocalOrdinal, GlobalOrdinal, Node> > A;
577 A = transposer.createTranspose(params);
// The result is exposed through the CrsMatrix interface and wrapped in a
// CrsMatrixWrap.
579 RCP<CrsMatrix> AAA = rcp_implicit_cast<CrsMatrix>(AA);
580 RCP<CrsMatrixWrap> AAAA =
rcp(
new CrsMatrixWrap(AAA));
// Any std::exception is reported on std::cout and then replaced by a
// RuntimeError with a generic message.
584 catch (std::exception& e) {
585 std::cout <<
"threw exception '" << e.what() <<
"'" << std::endl;
586 throw Exceptions::RuntimeError(
"Utilities::Transpose failed, perhaps because matrix is not a Crs matrix");
589 throw Exceptions::RuntimeError(
"Utilities::Transpose: Tpetra is not compiled with LO=GO=int. Add TPETRA_INST_INT_INT:BOOL=ON to your configuration!");
592 throw Exceptions::RuntimeError(
"Utilities::Transpose: Tpetra is not compiled!");
594 #ifndef __NVCC__ //prevent nvcc warning
// Epetra path: requires both Epetra and EpetraExt.
600 #if defined(HAVE_MUELU_EPETRA) && defined(HAVE_MUELU_EPETRAEXT)
604 EpetraExt::RowMatrix_Transpose transposer;
605 Epetra_CrsMatrix * A = dynamic_cast<Epetra_CrsMatrix*>(&transposer(epetraOp));
// NOTE(review): ReleaseTranspose() presumably makes the transposer give up
// ownership of A so that rcpA below can own it -- confirm in EpetraExt docs.
606 transposer.ReleaseTranspose();
608 RCP<Epetra_CrsMatrix> rcpA(A);
610 RCP<CrsMatrix> AAA = rcp_implicit_cast<CrsMatrix>(AA);
611 RCP<CrsMatrixWrap> AAAA =
rcp(
new CrsMatrixWrap(AAA));
// Domain and range maps are passed in swapped order relative to Op.
612 AAAA->fillComplete(Op.getRangeMap(), Op.getDomainMap());
616 throw Exceptions::RuntimeError(
"Epetra (Err. 2)");
618 #ifndef __NVCC__ //prevent nvcc warning
623 throw Exceptions::RuntimeError(
"Only Epetra and Tpetra matrices can be transposed.");
624 #ifndef __NVCC__ //prevent nvcc warning
629 #ifndef __NVCC__ //prevent nvcc warning
630 return Teuchos::null;
// Pulls the "Coordinates" entry out of paramList and returns it as an
// Xpetra::MultiVector<double,LO,GO,NO> handle. `coordinates` starts out as
// Teuchos::null.
// Side effect: in every visible branch that recognises the entry's type, the
// "Coordinates" entry is removed from paramList after it has been read.
636 static RCP<Xpetra::MultiVector<double,LO,GO,NO> > ExtractCoordinatesFromParameterList(ParameterList& paramList) {
637 RCP<Xpetra::MultiVector<double,LO,GO,NO> > coordinates = Teuchos::null;
// Guard for a missing "Coordinates" entry; the guarded statement is not part
// of this listing.
640 if(paramList.isParameter (
"Coordinates") ==
false)
// Tpetra-typed coordinates are only handled when Tpetra is enabled and
// instantiated for GO=int on the node type matching Epetra's configuration
// (OpenMP or Serial).
643 #if defined(HAVE_MUELU_TPETRA)
644 #if ( defined(EPETRA_HAVE_OMP) && defined(HAVE_TPETRA_INST_OPENMP) && defined(HAVE_TPETRA_INST_INT_INT)) || \
645 (!defined(EPETRA_HAVE_OMP) && defined(HAVE_TPETRA_INST_SERIAL) && defined(HAVE_TPETRA_INST_INT_INT))
// Float coordinates are only considered when Tpetra is not explicitly
// instantiated or has a float instantiation.
650 #if !defined(HAVE_TPETRA_EXPLICIT_INSTANTIATION) || defined(HAVE_TPETRA_INST_FLOAT)
652 RCP<tfMV> floatCoords = Teuchos::null;
659 RCP<tdMV> doubleCoords = Teuchos::null;
// Case 1: the entry already holds a double-valued Tpetra multivector.
660 if (paramList.isType<RCP<tdMV> >(
"Coordinates")) {
662 doubleCoords = paramList.get<RCP<tdMV> >(
"Coordinates");
663 paramList.remove(
"Coordinates");
665 #if !defined(HAVE_TPETRA_EXPLICIT_INSTANTIATION) || defined(HAVE_TPETRA_INST_FLOAT)
// Case 2: the entry holds a float-valued multivector; a double multivector
// with the same map and number of vectors is allocated for it.
666 else if (paramList.isType<RCP<tfMV> >(
"Coordinates")) {
668 floatCoords = paramList.get<RCP<tfMV> >(
"Coordinates");
669 paramList.remove(
"Coordinates");
670 doubleCoords =
rcp(
new tdMV(floatCoords->getMap(), floatCoords->getNumVectors()));
675 if(doubleCoords != Teuchos::null) {
679 #endif // Tpetra instantiated on GO=int and EpetraNode
680 #endif // endif HAVE_TPETRA
// Epetra-typed coordinates.
682 #if defined(HAVE_MUELU_EPETRA)
683 RCP<Epetra_MultiVector> doubleEpCoords;
684 if (paramList.isType<RCP<Epetra_MultiVector> >(
"Coordinates")) {
685 doubleEpCoords = paramList.get<RCP<Epetra_MultiVector> >(
"Coordinates");
686 paramList.remove(
"Coordinates");
700 template <
class View,
unsigned AppendValue >
705 template <
class MT,
unsigned T >
706 struct CombineMemoryTraits {
// Partial specialization for a first argument of the form
// Kokkos::MemoryTraits<U>: `type` is Kokkos::MemoryTraits with the flag values
// U and T OR-ed together.
710 template <
unsigned U,
unsigned T>
711 struct CombineMemoryTraits<Kokkos::MemoryTraits<U>, T> {
712 typedef Kokkos::MemoryTraits<U|T> type;
// Partial specialization of AppendTrait for Kokkos::View<DataType, Pack...>.
// `view_type` names the input view. `type` is a Kokkos::View with the same
// DataType, the input view's array_layout and device_type, and the input
// view's memory_traits combined with T through CombineMemoryTraits.
715 template <
class DataType,
unsigned T,
class... Pack >
716 struct AppendTrait< Kokkos::
View< DataType, Pack... >, T> {
717 typedef Kokkos::View< DataType, Pack... > view_type;
718 using type = Kokkos::View< DataType, typename view_type::array_layout, typename view_type::device_type, typename CombineMemoryTraits<typename view_type::memory_traits,T>::type >;
723 #define MUELU_UTILITIES_KOKKOS_SHORT
725 #endif // #if defined(HAVE_MUELU_KOKKOS_REFACTOR)
727 #endif // MUELU_UTILITIES_KOKKOS_DECL_HPP