[wip] [skip ci] Enable amgcl/opencl in trilinos application

ddemidov · ddemidov · commit e97e1f4835f5 · 2019-01-17T10:31:04.000+03:00
diff --git a/applications/trilinos_application/CMakeLists.txt b/applications/trilinos_application/CMakeLists.txt
@@ -50,6 +50,7 @@ set( KRATOS_TRILINOS_APPLICATION_SOURCES
 	${CMAKE_CURRENT_SOURCE_DIR}/custom_factories/trilinos_linear_solver_factory.cpp
     ${CMAKE_SOURCE_DIR}/applications/FluidDynamicsApplication/fluid_dynamics_application_variables.cpp  #TODO: this should REALLY NOT BE HERE
     ${CMAKE_CURRENT_SOURCE_DIR}/custom_utilities/mpi_normal_calculation_utilities.cpp;
+    ${CMAKE_CURRENT_SOURCE_DIR}/amgcl_mpi_solver_impl.cpp;
 )
 
 ## Kratos tests sources. Enabled by default
diff --git a/applications/trilinos_application/amgcl_mpi_solver_impl.cpp b/applications/trilinos_application/amgcl_mpi_solver_impl.cpp
@@ -0,0 +1,244 @@
+#ifndef KRATOS_AMGCL_MPI_SOLVE_FUNCTIONS_H
+#define KRATOS_AMGCL_MPI_SOLVE_FUNCTIONS_H
+
+#include <boost/range/iterator_range.hpp>
+#include <boost/property_tree/ptree.hpp>
+
+#include <amgcl/adapter/crs_tuple.hpp>
+#include <amgcl/adapter/epetra.hpp>
+#include <amgcl/adapter/ublas.hpp>
+#include <amgcl/adapter/zero_copy.hpp>
+#include <amgcl/adapter/block_matrix.hpp>
+#include <amgcl/backend/builtin.hpp>
+#include <amgcl/value_type/static_matrix.hpp>
+#include <amgcl/solver/runtime.hpp>
+
+#include <amgcl/mpi/util.hpp>
+#include <amgcl/mpi/make_solver.hpp>
+#include <amgcl/mpi/amg.hpp>
+#include <amgcl/mpi/coarsening/runtime.hpp>
+#include <amgcl/mpi/relaxation/runtime.hpp>
+#include <amgcl/mpi/direct_solver/runtime.hpp>
+#include <amgcl/mpi/partition/runtime.hpp>
+
+#ifdef KRATOS_HAVE_OPENCL
+#  include <amgcl/backend/vexcl.hpp>
+#  include <amgcl/backend/vexcl_static_matrix.hpp>
+#endif
+
+#include "Epetra_FECrsMatrix.h"
+#include "Epetra_FEVector.h"
+#include "trilinos_space.h"
+
+namespace Kratos
+{
+
+#ifdef KRATOS_HAVE_OPENCL
+vex::Context& vexcl_context(); // declaration only (no definition in this file); the solvers below test it in a boolean context and assign it to the VexCL backend parameters
+// Declaration only (no definition in this file); AMGCLBlockSolve calls it before building a VexCL-backed block solver.
+template <int TBlockSize>
+void register_vexcl_static_matrix_type();
+#endif // KRATOS_HAVE_OPENCL
+
+// Specialization of AMGCLScalarSolve for distributed systems: builds an amgcl MPI solver on MPI_COMM_WORLD from rA and solves with rB as right-hand side and rX as the unknown.
+template <class TSparseSpaceType>
+typename std::enable_if<TSparseSpaceType::IsDistributed(), void>::type // participates in overload resolution only when IsDistributed() is true
+AMGCLScalarSolve(
+    typename TSparseSpaceType::MatrixType& rA, // system matrix; wrapped with amgcl::adapter::map() and queried for NumMyRows()
+    typename TSparseSpaceType::VectorType& rX, // unknown vector; its Values() storage is handed to the solver and holds the result on return
+    typename TSparseSpaceType::VectorType& rB, // right-hand side; only the first NumMyRows() entries of Values() are used
+    typename TSparseSpaceType::IndexType& rIterationNumber, // output: first element of the tuple returned by the solver
+    double& rResidual, // output: second element of the tuple returned by the solver
+    const boost::property_tree::ptree &amgclParams, // forwarded unchanged to the solver constructor
+    int verbosity_level, // not used in this function body
+    bool use_opencl // request the VexCL backend; ignored unless built with KRATOS_HAVE_OPENCL
+    )
+{
+#ifdef KRATOS_HAVE_OPENCL
+    if (use_opencl && vexcl_context()) { // VexCL path: taken only when requested and the context tests true
+        auto &ctx = vexcl_context();
+
+        typedef amgcl::backend::vexcl<double> Backend;
+
+        typedef
+            amgcl::mpi::make_solver<
+                amgcl::mpi::amg<
+                    Backend,
+                    amgcl::runtime::mpi::coarsening::wrapper<Backend>,
+                    amgcl::runtime::mpi::relaxation::wrapper<Backend>,
+                    amgcl::runtime::mpi::direct::solver<double>,
+                    amgcl::runtime::mpi::partition::wrapper<Backend>
+                    >,
+                amgcl::runtime::solver::wrapper
+                >
+            Solver;
+
+        Backend::params bprm;
+        bprm.q = ctx; // pass the VexCL context to the backend through its parameters
+
+        Solver solve(MPI_COMM_WORLD, amgcl::adapter::map(rA), amgclParams, bprm);
+
+        std::size_t n = rA.NumMyRows();
+        // Copy the first n host values of rB and rX into VexCL vectors (rX supplies the starting values of x).
+        vex::vector<double> b(ctx, n, rB.Values());
+        vex::vector<double> x(ctx, n, rX.Values());
+
+        std::tie(rIterationNumber, rResidual) = solve(b, x);
+        // Copy the computed x back into rX's host storage.
+        vex::copy(x.begin(), x.end(), rX.Values());
+    } else
+#endif // KRATOS_HAVE_OPENCL
+    { // builtin-backend path: the else-branch when OpenCL support is compiled in, a plain unconditional block otherwise
+        typedef amgcl::backend::builtin<double> Backend;
+
+        typedef
+            amgcl::mpi::make_solver<
+                amgcl::mpi::amg<
+                    Backend,
+                    amgcl::runtime::mpi::coarsening::wrapper<Backend>,
+                    amgcl::runtime::mpi::relaxation::wrapper<Backend>,
+                    amgcl::runtime::mpi::direct::solver<double>,
+                    amgcl::runtime::mpi::partition::wrapper<Backend>
+                    >,
+                amgcl::runtime::solver::wrapper
+                >
+            Solver;
+
+        Solver solve(MPI_COMM_WORLD, amgcl::adapter::map(rA), amgclParams);
+
+        std::size_t n = rA.NumMyRows();
+        // Non-owning ranges over the vectors' own storage: no copy is made, so the solver works directly on rX.
+        auto b_range = boost::make_iterator_range(rB.Values(), rB.Values() + n);
+        auto x_range = boost::make_iterator_range(rX.Values(), rX.Values() + n);
+
+        std::tie(rIterationNumber, rResidual) = solve(b_range, x_range);
+    }
+}
+
+// Specialization of AMGCLBlockSolve for distributed systems: same as the scalar solve, but rA is viewed as a matrix of TBlockSize x TBlockSize blocks and rX/rB as arrays of TBlockSize x 1 blocks.
+template <int TBlockSize, class TSparseSpaceType>
+typename std::enable_if<TSparseSpaceType::IsDistributed(), void>::type // participates in overload resolution only when IsDistributed() is true
+AMGCLBlockSolve(
+    typename TSparseSpaceType::MatrixType & rA, // system matrix; wrapped with amgcl::adapter::map() and then amgcl::adapter::block_matrix<>
+    typename TSparseSpaceType::VectorType& rX, // unknown vector; its Values() storage is reinterpreted as blocks and holds the result on return
+    typename TSparseSpaceType::VectorType& rB, // right-hand side; its Values() storage is reinterpreted as read-only blocks
+    typename TSparseSpaceType::IndexType& rIterationNumber, // output: first element of the tuple returned by the solver
+    double& rResidual, // output: second element of the tuple returned by the solver
+    boost::property_tree::ptree amgclParams, // taken by value so the override below stays local to this call
+    int verbosity_level, // not used in this function body
+    bool use_opencl // request the VexCL backend; ignored unless built with KRATOS_HAVE_OPENCL
+    )
+{
+    amgclParams.put("precond.coarsening.aggr.block_size",1);
+    // NOTE(review): block_size is forced to 1 presumably because blocking is already expressed by the static_matrix value type - confirm.
+    typedef amgcl::static_matrix<double, TBlockSize, TBlockSize> val_type;
+    typedef amgcl::static_matrix<double, TBlockSize, 1> rhs_type;
+    // NOTE(review): integer division - if n is not a multiple of TBlockSize the trailing rows are left out; confirm callers guarantee divisibility.
+    std::size_t n = rA.RowMap().NumMyElements();
+    std::size_t nb = n / TBlockSize; // number of rhs_type blocks in the local vectors; used by both backend paths
+
+#ifdef KRATOS_HAVE_OPENCL
+    if (use_opencl && vexcl_context()) { // VexCL path: taken only when requested and the context tests true
+        auto &ctx = vexcl_context();
+        register_vexcl_static_matrix_type<TBlockSize>();
+
+        typedef amgcl::backend::vexcl<val_type> Backend;
+
+        typedef
+            amgcl::mpi::make_solver<
+                amgcl::mpi::amg<
+                    Backend,
+                    amgcl::runtime::mpi::coarsening::wrapper<Backend>,
+                    amgcl::runtime::mpi::relaxation::wrapper<Backend>,
+                    amgcl::runtime::mpi::direct::solver<val_type>,
+                    amgcl::runtime::mpi::partition::wrapper<Backend>
+                    >,
+                amgcl::runtime::solver::wrapper
+                >
+            Solver;
+
+        typename Backend::params bprm;
+        bprm.q = ctx; // pass the VexCL context to the backend through its parameters
+
+        Solver solve(
+                MPI_COMM_WORLD,
+                amgcl::adapter::block_matrix<val_type>(amgcl::adapter::map(rA)),
+                amgclParams, bprm
+                );
+        // View the local double storage of rB / rX as arrays of TBlockSize x 1 blocks.
+        auto b_begin = reinterpret_cast<const rhs_type*>(rB.Values());
+        auto x_begin = reinterpret_cast<rhs_type*>(rX.Values());
+        // Copy nb blocks of each into VexCL vectors (rX supplies the starting values of x).
+        vex::vector<rhs_type> x(ctx, nb, x_begin);
+        vex::vector<rhs_type> b(ctx, nb, b_begin);
+
+        std::tie(rIterationNumber, rResidual) = solve(b, x);
+        // Copy the computed x back into rX's host storage.
+        vex::copy(x.begin(), x.end(), x_begin);
+    } else
+#endif // KRATOS_HAVE_OPENCL
+    { // builtin-backend path: the else-branch when OpenCL support is compiled in, a plain unconditional block otherwise
+        typedef amgcl::backend::builtin<val_type> Backend;
+
+        typedef
+            amgcl::mpi::make_solver<
+                amgcl::mpi::amg<
+                    Backend,
+                    amgcl::runtime::mpi::coarsening::wrapper<Backend>,
+                    amgcl::runtime::mpi::relaxation::wrapper<Backend>,
+                    amgcl::runtime::mpi::direct::solver<val_type>,
+                    amgcl::runtime::mpi::partition::wrapper<Backend>
+                    >,
+                amgcl::runtime::solver::wrapper
+                >
+            Solver;
+
+        Solver solve(
+                MPI_COMM_WORLD,
+                amgcl::adapter::block_matrix<val_type>(amgcl::adapter::map(rA)),
+                amgclParams
+                );
+        // View the local double storage of rB / rX as arrays of TBlockSize x 1 blocks.
+        auto b_begin = reinterpret_cast<const rhs_type*>(rB.Values());
+        auto x_begin = reinterpret_cast<rhs_type*>(rX.Values());
+        // Non-owning ranges of nb blocks over the vectors' own storage: no copy is made, so the solver works directly on rX.
+        auto b_range = boost::make_iterator_range(b_begin, b_begin + nb);
+        auto x_range = boost::make_iterator_range(x_begin, x_begin + nb);
+
+        std::tie(rIterationNumber, rResidual) = solve(b_range, x_range);
+    }
+}
+
+// Explicit instantiations: the solver templates are defined only in this translation unit, so each specialization used elsewhere has to be instantiated here.
+template void AMGCLScalarSolve< TrilinosSpace<Epetra_FECrsMatrix, Epetra_FEVector> >(
+    TrilinosSpace<Epetra_FECrsMatrix, Epetra_FEVector>::MatrixType& rA,
+    TrilinosSpace<Epetra_FECrsMatrix, Epetra_FEVector>::VectorType& rX,
+    TrilinosSpace<Epetra_FECrsMatrix, Epetra_FEVector>::VectorType& rB,
+    TrilinosSpace<Epetra_FECrsMatrix, Epetra_FEVector>::IndexType& rIterationNumber,
+    double& rResidual,
+    const boost::property_tree::ptree &amgclParams,
+    int verbosity_level,
+    bool use_opencl
+    );
+// Expands to an explicit instantiation of AMGCLBlockSolve<B, TrilinosSpace<...>>; the terminating ';' is supplied at the point of use.
+#define INSTANTIATE_BLOCK_SOLVER(B)                                                    \
+template void AMGCLBlockSolve<B, TrilinosSpace<Epetra_FECrsMatrix, Epetra_FEVector> >( \
+    TrilinosSpace<Epetra_FECrsMatrix, Epetra_FEVector>::MatrixType& rA,                \
+    TrilinosSpace<Epetra_FECrsMatrix, Epetra_FEVector>::VectorType& rX,                \
+    TrilinosSpace<Epetra_FECrsMatrix, Epetra_FEVector>::VectorType& rB,                \
+    TrilinosSpace<Epetra_FECrsMatrix, Epetra_FEVector>::IndexType& rIterationNumber,   \
+    double& rResidual,                                                                 \
+    boost::property_tree::ptree amgclParams,                                           \
+    int verbosity_level,                                                               \
+    bool use_opencl                                                                    \
+    )
+// Only block sizes 2, 3 and 4 are instantiated; any other TBlockSize has no definition emitted by this file.
+INSTANTIATE_BLOCK_SOLVER(2);
+INSTANTIATE_BLOCK_SOLVER(3);
+INSTANTIATE_BLOCK_SOLVER(4);
+
+#undef INSTANTIATE_BLOCK_SOLVER
+
+} // namespace Kratos
+
+#endif
diff --git a/applications/trilinos_application/external_includes/amgcl_mpi_solve_functions.h b/applications/trilinos_application/external_includes/amgcl_mpi_solve_functions.h
@@ -1,24 +1,7 @@
 #ifndef KRATOS_AMGCL_MPI_SOLVE_FUNCTIONS_H
 #define KRATOS_AMGCL_MPI_SOLVE_FUNCTIONS_H
 
-#include <boost/range/iterator_range.hpp>
-
-#include <amgcl/adapter/crs_tuple.hpp>
-#include <amgcl/adapter/epetra.hpp>
-#include <amgcl/adapter/ublas.hpp>
-#include <amgcl/adapter/zero_copy.hpp>
-#include <amgcl/adapter/block_matrix.hpp>
-#include <amgcl/backend/builtin.hpp>
-#include <amgcl/value_type/static_matrix.hpp>
-#include <amgcl/solver/runtime.hpp>
-
-#include <amgcl/mpi/util.hpp>
-#include <amgcl/mpi/make_solver.hpp>
-#include <amgcl/mpi/amg.hpp>
-#include <amgcl/mpi/coarsening/runtime.hpp>
-#include <amgcl/mpi/relaxation/runtime.hpp>
-#include <amgcl/mpi/direct_solver/runtime.hpp>
-#include <amgcl/mpi/partition/runtime.hpp>
+#include <boost/property_tree/ptree.hpp>
 
 namespace Kratos
 {
@@ -34,33 +17,8 @@ AMGCLScalarSolve(
     double& rResidual,
     const boost::property_tree::ptree &amgclParams,
     int verbosity_level,
-    bool /*use_opencl*/
-    )
-{
-    typedef amgcl::backend::builtin<double> Backend;
-
-    typedef
-        amgcl::mpi::make_solver<
-            amgcl::mpi::amg<
-                Backend,
-                amgcl::runtime::mpi::coarsening::wrapper<Backend>,
-                amgcl::runtime::mpi::relaxation::wrapper<Backend>,
-                amgcl::runtime::mpi::direct::solver<double>,
-                amgcl::runtime::mpi::partition::wrapper<Backend>
-                >,
-            amgcl::runtime::solver::wrapper
-            >
-        Solver;
-
-    Solver solve(MPI_COMM_WORLD, amgcl::adapter::map(rA), amgclParams);
-
-    std::size_t n = rA.NumMyRows();
-
-    auto b_range = boost::make_iterator_range(rB.Values(), rB.Values() + n);
-    auto x_range = boost::make_iterator_range(rX.Values(), rX.Values() + n);
-
-    std::tie(rIterationNumber, rResidual) = solve(b_range, x_range);
-}
+    bool use_opencl
+    );
 
 // Spacialization of AMGCLBlockSolve for distribued systems.
 template <int TBlockSize, class TSparseSpaceType>
@@ -73,44 +31,8 @@ AMGCLBlockSolve(
     double& rResidual,
     boost::property_tree::ptree amgclParams,
     int verbosity_level,
-    bool /*use_opencl*/
-    )
-{
-    amgclParams.put("precond.coarsening.aggr.block_size",1);
-
-    typedef amgcl::static_matrix<double, TBlockSize, TBlockSize> val_type;
-    typedef amgcl::static_matrix<double, TBlockSize, 1> rhs_type;
-    typedef amgcl::backend::builtin<val_type> Backend;
-
-    std::size_t n = rA.RowMap().NumMyElements();
-
-    typedef
-        amgcl::mpi::make_solver<
-            amgcl::mpi::amg<
-                Backend,
-                amgcl::runtime::mpi::coarsening::wrapper<Backend>,
-                amgcl::runtime::mpi::relaxation::wrapper<Backend>,
-                amgcl::runtime::mpi::direct::solver<val_type>,
-                amgcl::runtime::mpi::partition::wrapper<Backend>
-                >,
-            amgcl::runtime::solver::wrapper
-            >
-        Solver;
-
-    Solver solve(
-            MPI_COMM_WORLD,
-            amgcl::adapter::block_matrix<val_type>(amgcl::adapter::map(rA)),
-            amgclParams
-            );
-
-    auto b_begin = reinterpret_cast<const rhs_type*>(rB.Values());
-    auto x_begin = reinterpret_cast<rhs_type*>(rX.Values());
-
-    auto b_range = boost::make_iterator_range(b_begin, b_begin + n / TBlockSize);
-    auto x_range = boost::make_iterator_range(x_begin, x_begin + n / TBlockSize);
-
-    std::tie(rIterationNumber, rResidual) = solve(b_range, x_range);
-}
+    bool use_opencl
+    );
 
 } // namespace Kratos
 
diff --git a/external_libraries/amgcl/adapter/epetra.hpp b/external_libraries/amgcl/adapter/epetra.hpp
@@ -38,6 +38,7 @@ THE SOFTWARE.
 #include <Epetra_CrsMatrix.h>
 #include <Epetra_IntVector.h>
 #include <Epetra_Import.h>
+#include <Epetra_Comm.h>
 
 #include <amgcl/backend/interface.hpp>
 

Original file line number	Diff line number	Diff line change
`@@ -50,6 +50,7 @@ set( KRATOS_TRILINOS_APPLICATION_SOURCES`
`50`	`50`	`${CMAKE_CURRENT_SOURCE_DIR}/custom_factories/trilinos_linear_solver_factory.cpp`
`51`	`51`	`${CMAKE_SOURCE_DIR}/applications/FluidDynamicsApplication/fluid_dynamics_application_variables.cpp #TODO: this should REALLY NOT BE HERE`
`52`	`52`	`${CMAKE_CURRENT_SOURCE_DIR}/custom_utilities/mpi_normal_calculation_utilities.cpp;`
	`53`	`+ ${CMAKE_CURRENT_SOURCE_DIR}/amgcl_mpi_solver_impl.cpp;`
`53`	`54`	`)`
`54`	`55`
`55`	`56`	`## Kratos tests sources. Enabled by default`