OpmGpuILU0.hpp
Go to the documentation of this file.
1/*
2 Copyright 2024 SINTEF AS
3
4 This file is part of the Open Porous Media project (OPM).
5
6 OPM is free software: you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation, either version 3 of the License, or
9 (at your option) any later version.
10
11 OPM is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with OPM. If not, see <http://www.gnu.org/licenses/>.
18*/
19#ifndef OPM_GPUILU0_OPM_Impl_HPP
20#define OPM_GPUILU0_OPM_Impl_HPP
21
22#include <memory>
23#include <opm/grid/utility/SparseTable.hpp>
27#include <optional>
28#include <type_traits>
29#include <vector>
30
31
32namespace Opm::gpuistl
33{
44template <class M, class X, class Y, int l = 1>
46{
47public:
49 using matrix_type = typename std::remove_const<M>::type;
51 using domain_type = X;
53 using range_type = Y;
55 using field_type = typename X::field_type;
58
65 explicit OpmGpuILU0(const M& A, bool splitMatrix, bool tuneKernels);
66
69 void pre(X& x, Y& b) override;
70
72 void apply(X& v, const Y& d) override;
73
76 void post(X& x) override;
77
79 Dune::SolverCategory::Category category() const override;
80
82 void update() final;
83
85 void LUFactorizeAndMoveData(int moveThreadBlockSize, int factorizationThreadBlockSize);
86
89
91 static constexpr bool shouldCallPre()
92 {
93 return false;
94 }
95
97 static constexpr bool shouldCallPost()
98 {
99 return false;
100 }
101
102 virtual bool hasPerfectUpdate() const override {
103 return true;
104 }
105
106
107private:
109 void apply(X& v, const Y& d, int lowerSolveThreadBlockSize, int upperSolveThreadBlockSize);
111 void update(int moveThreadBlockSize, int factorizationThreadBlockSize);
113 const M& m_cpuMatrix;
115 static constexpr const size_t blocksize_ = matrix_type::block_type::cols;
117 Opm::SparseTable<size_t> m_levelSets;
119 std::vector<int> m_reorderedToNatural;
121 std::vector<int> m_naturalToReordered;
123 CuMat m_gpuMatrix;
124 std::unique_ptr<CuMat> m_gpuReorderedLU;
126 std::unique_ptr<CuMat> m_gpuMatrixReorderedLower;
127 std::unique_ptr<CuMat> m_gpuMatrixReorderedUpper;
129 std::optional<GpuVector<field_type>> m_gpuMatrixReorderedDiag;
131 GpuVector<int> m_gpuNaturalToReorder;
133 GpuVector<int> m_gpuReorderToNatural;
135 GpuVector<field_type> m_gpuDInv;
137 bool m_splitMatrix;
139 bool m_tuneThreadBlockSizes;
142 int m_upperSolveThreadBlockSize = -1;
143 int m_lowerSolveThreadBlockSize = -1;
144 int m_moveThreadBlockSize = -1;
145 int m_ILU0FactorizationThreadBlockSize = -1;
146};
147} // end namespace Opm::gpuistl
148
149#endif
Interface class adding the update() method to the preconditioner interface.
Definition: PreconditionerWithUpdate.hpp:32
ILU0 preconditioner on the GPU.
Definition: OpmGpuILU0.hpp:46
static constexpr bool shouldCallPost()
Definition: OpmGpuILU0.hpp:97
Y range_type
The range type of the preconditioner.
Definition: OpmGpuILU0.hpp:53
void pre(X &x, Y &b) override
Prepare the preconditioner.
void update() final
Updates the matrix data.
void apply(X &v, const Y &d) override
Apply the preconditioner.
GpuSparseMatrix< field_type > CuMat
The GPU matrix type.
Definition: OpmGpuILU0.hpp:57
OpmGpuILU0(const M &A, bool splitMatrix, bool tuneKernels)
Constructor.
static constexpr bool shouldCallPre()
Definition: OpmGpuILU0.hpp:91
typename X::field_type field_type
The field type of the preconditioner.
Definition: OpmGpuILU0.hpp:55
void LUFactorizeAndMoveData(int moveThreadBlockSize, int factorizationThreadBlockSize)
Compute LU factorization, and update the data of the reordered matrix.
Dune::SolverCategory::Category category() const override
Category of the preconditioner (see SolverCategory::Category)
void post(X &x) override
Post processing.
void tuneThreadBlockSizes()
Function that experimentally tunes the thread block sizes of the important CUDA kernels.
typename std::remove_const< M >::type matrix_type
The matrix type the preconditioner is for.
Definition: OpmGpuILU0.hpp:49
virtual bool hasPerfectUpdate() const override
Definition: OpmGpuILU0.hpp:102
X domain_type
The domain type of the preconditioner.
Definition: OpmGpuILU0.hpp:51
Definition: autotuner.hpp:29