1 /**********************************************************************\
2 ______ __ __ _______ _______ __ __ __ __ __ ___
3 / || | | | | ____|| ____|| | | | | \ | | | |/ /
4 | ,----'| | | | | |__ | |__ | | | | | \| | | ' /
5 | | | | | | | __| | __| | | | | | . ` | | <
6 | `----.| `--' | | | | | | `----.| | | |\ | | . \
7 \______| \______/ |__| |__| |_______||__| |__| \__| |__|\__\
11 cufflink is a library for linking numerical methods based on Nvidia's
12 Compute Unified Device Architecture (CUDA™) C/C++ programming language
15 Please note that cufflink is not approved or endorsed by ESI-OpenCFD®
16 Limited, the owner of the OpenFOAM® and OpenCFD® trademarks and
17 producer of OpenFOAM® software.
19 The official web-site of OpenCFD® Limited is www.openfoam.com .
21 ------------------------------------------------------------------------
22 This file is part of cufflink.
24 cufflink is free software: you can redistribute it and/or modify
25 it under the terms of the GNU General Public License as published by
26 the Free Software Foundation, either version 3 of the License, or
27 (at your option) any later version.
29 cufflink is distributed in the hope that it will be useful,
30 but WITHOUT ANY WARRANTY; without even the implied warranty of
31 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
32 GNU General Public License for more details.
34 You should have received a copy of the GNU General Public License
35 along with cufflink. If not, see <http://www.gnu.org/licenses/>.
38 Daniel P. Combest. All rights reserved.
39 Modifications by Dominik Christ, Wikki Ltd.
42 diagonal preconditioned conjugate gradient
43 solver for symmetric Matrices using a CUSP CUDA™ based solver.
45 \**********************************************************************/
47 #include "cudaTypes.H"
50 #include <cusp/detail/config.h>
51 #include <cusp/verify.h>
52 #include <cusp/precond/ainv.h>
53 #include <cusp/coo_matrix.h>
54 #include <cusp/blas.h>
55 #include <cusp/multiply.h>
57 extern "C" void cgAinv
59 cuspEquationSystem* ces,
60 cudaSolverPerformance* solverPerf,
61 ValueType drop_tolerance,
68 #include "fillCOOMatrix.H"
71 // #include "cufflink/setGPUStorage.H"
73 if (solverPerf->debugCusp)
75 std::cout<<" Using Ainv preconditioner\n";
78 cusp::precond::bridson_ainv<ValueType, MemorySpace> M
87 // Start the krylov solver
88 assert(A.num_rows == A.num_cols); // sanity check
90 const size_t N = A.num_rows;
93 cusp::array1d<ValueType,MemorySpace> y(N);
94 cusp::array1d<ValueType,MemorySpace> z(N);
95 cusp::array1d<ValueType,MemorySpace> r(N);
96 cusp::array1d<ValueType,MemorySpace> p(N);
99 cusp::multiply(A, X, y);
101 // Define the normalization factor
102 ValueType normFactor = 1.0;
104 # include "buildNormFactor.H"
107 cusp::blas::axpby(B, y, r, ValueType(1), ValueType(-1));
110 cusp::multiply(M, r, z);
113 cusp::blas::copy(z, p);
116 ValueType rz = cusp::blas::dotc(r, z);
118 ValueType normR = cusp::blas::nrm2(r)/normFactor;
119 ValueType normR0 = normR; // Initial residual
120 solverPerf->iRes = normR0;
125 normR > (solverPerf->tol)
126 && count < (solverPerf->maxIter)
127 && normR/normR0 >= (solverPerf->relTol)
128 || count < solverPerf->minIter
132 cusp::multiply(A, p, y);
134 // alpha <- <r,z>/<y,p>
135 ValueType alpha = rz / cusp::blas::dotc(y, p);
137 // x <- x + alpha * p
138 cusp::blas::axpy(p, X, alpha);
140 // r <- r - alpha * y
141 cusp::blas::axpy(y, r, -alpha);
144 cusp::multiply(M, r, z);
146 ValueType rz_old = rz;
149 rz = cusp::blas::dotc(r, z);
151 // beta <- <r_{i+1},r_{i+1}>/<r,r>
152 ValueType beta = rz / rz_old;
154 // p <- r + beta*p should be p <- z + beta*p
155 cusp::blas::axpby(z, p, p, ValueType(1), beta);
157 normR = cusp::blas::nrm2(r)/normFactor;
161 // End the krylov solver
164 solverPerf->fRes = normR;
165 solverPerf->nIterations = count;
170 solverPerf->fRes<=solverPerf->tol
171 || solverPerf->fRes/solverPerf->iRes<=solverPerf->relTol
174 solverPerf->converged = true;
178 solverPerf->converged = false;
181 // Pass the solution vector back