Disable instruction fusion on Power8
[gromacs.git] / src / gromacs / linearalgebra / gmx_blas.h
blob991cf8b2e6b1ce8baaaf64f6c487a34afb9dcb6b
1 /*
2 * This file is part of the GROMACS molecular simulation package.
4 * Copyright (c) 1991-2000, University of Groningen, The Netherlands.
5 * Copyright (c) 2001-2008, The GROMACS development team.
6 * Copyright (c) 2012,2013,2014, by the GROMACS development team, led by
7 * Mark Abraham, David van der Spoel, Berk Hess, and Erik Lindahl,
8 * and including many others, as listed in the AUTHORS file in the
9 * top-level source directory and at http://www.gromacs.org.
11 * GROMACS is free software; you can redistribute it and/or
12 * modify it under the terms of the GNU Lesser General Public License
13 * as published by the Free Software Foundation; either version 2.1
14 * of the License, or (at your option) any later version.
16 * GROMACS is distributed in the hope that it will be useful,
17 * but WITHOUT ANY WARRANTY; without even the implied warranty of
18 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
19 * Lesser General Public License for more details.
21 * You should have received a copy of the GNU Lesser General Public
22 * License along with GROMACS; if not, see
23 * http://www.gnu.org/licenses, or write to the Free Software Foundation,
24 * Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
26 * If you want to redistribute modifications to GROMACS, please
27 * consider that scientific software is very special. Version
28 * control is crucial - bugs must be traceable. We will be happy to
29 * consider code for inclusion in the official distribution, but
30 * derived work must not be called official GROMACS. Details are found
31 * in the README & COPYING files - if they are missing, get the
32 * official version at http://www.gromacs.org.
34 * To help us fund GROMACS development, we humbly ask that you cite
35 * the research papers on the package. Check out http://www.gromacs.org.
36 */
37 /*! \internal \file
38 * \brief
39 * Header definitions for the standard BLAS library.
41 * This is the subset of BLAS routines used for the
42 * linear algebra operations in Gromacs.
43 * Do NOT use this for other purposes - we only provide this as a
44 * simple fallback/reference implementation when no optimized BLAS
45 * is present. If you need an implementation for your own code
46 * there are several much faster versions out there.
48 * All routines are compatible with the BLAS reference implementation,
49 * meaning they assume fortran-style matrix row/column organization.
51 * There is plenty of documentation for these routines available
52 * at http://www.netlib.org/blas , so there is no point in repeating
53 * it here.
54 */
55 #ifndef GMX_BLAS_H
56 #define GMX_BLAS_H
58 /*! \cond */
60 #include "config.h"
62 /* These are not required by this file, but by the internal BLAS
63 * implementation. In principle, they could be included in each file
64 * that requires them, but this is simpler. Since the header is internal
65 * to the linearalgebra/ module, the added complexity may not be worth it. */
66 #include "gromacs/utility/basedefinitions.h"
67 #include "gromacs/utility/real.h"
/* Give every declaration that follows C linkage when this header is
 * compiled as C++. The matching closing brace sits near the end of the
 * header, inside its own __cplusplus guard. */
#ifdef __cplusplus
extern "C" {
#endif
/* Never compiled: this brace presumably exists only so that editors and
 * indentation tools see the brace above as balanced. */
#if 0
}
#endif
76 /* Double precision versions */
77 double
78 F77_FUNC(dasum, DASUM) (int *n, double *dx, int *incx);
80 void
81 F77_FUNC(daxpy, DAXPY) (int *n, double *da, double *dx, int *incx, double *dy, int *incy);
83 void
84 F77_FUNC(dcopy, DCOPY) (int *n, double *dx, int *incx, double *dy, int *incy);
86 double
87 F77_FUNC(ddot, DDOT) (int *n, double *dx, int *incx, double *dy, int *incy);
89 void
90 F77_FUNC(dgemm, DGEMM) (const char *transa, const char *transb, int *m, int *n, int *k,
91 double *alpha, double *a, int *lda, double *b, int *ldb,
92 double *beta, double *c, int *ldc);
94 void
95 F77_FUNC(dgemv, DGEMV) (const char *trans, int *m, int *n, double *alpha, double *a, int *lda,
96 double *x, int *incx, double *beta, double *y, int *incy);
98 void
99 F77_FUNC(dger, DGER) (int *m, int *n, double *alpha, double *x, int *incx,
100 double *y, int *incy, double *a, int *lda);
102 double
103 F77_FUNC(dnrm2, DNRM2) (int *n, double *x, int *incx);
105 void
106 F77_FUNC(drot, DROT) (int *n, double *dx, int *incx,
107 double *dy, int *incy, double *c, double *s);
109 void
110 F77_FUNC(dscal, DSCAL) (int *n, double *fact, double *dx, int *incx);
112 void
113 F77_FUNC(dswap, DSWAP) (int *n, double *dx, int *incx, double *dy, int *incy);
115 void
116 F77_FUNC(dsymv, DSYMV) (const char *uplo, int *n, double *alpha, double *a, int *lda,
117 double *x, int *incx, double *beta, double *y, int *incy);
119 void
120 F77_FUNC(dsyr2, DSYR2) (const char *uplo, int *n, double *alpha, double *x, int *incx,
121 double *y, int *incy, double *a, int *lda);
123 void
124 F77_FUNC(dsyr2k, DSYR2K) (const char *uplo, const char *trans, int *n, int *k, double *alpha, double *a,
125 int *lda, double *b, int *ldb, double *beta, double *c, int *ldc);
127 void
128 F77_FUNC(dtrmm, DTRMM) (const char *side, const char *uplo, const char *transa, const char *diag, int *m, int *n,
129 double *alpha, double *a, int *lda, double *b, int *ldb);
131 void
132 F77_FUNC(dtrmv, DTRMV) (const char *uplo, const char *trans, const char *diag, int *n,
133 double *a, int *lda, double *x, int *incx);
135 void
136 F77_FUNC(dtrsm, DTRSM) (const char *side, const char *uplo, const char *transa, const char *diag, int *m, int *n,
137 double *alpha, double *a, int *lda, double *b, int *ldb);
140 F77_FUNC(idamax, IDAMAX) (int *n, double *dx, int *incx);
144 /* Single precision versions */
145 float
146 F77_FUNC(sasum, SASUM) (int *n, float *dx, int *incx);
148 void
149 F77_FUNC(saxpy, SAXPY) (int *n, float *da, float *dx, int *incx, float *dy, int *incy);
151 void
152 F77_FUNC(scopy, SCOPY) (int *n, float *dx, int *incx, float *dy, int *incy);
154 float
155 F77_FUNC(sdot, SDOT) (int *n, float *dx, int *incx, float *dy, int *incy);
157 void
158 F77_FUNC(sgemm, SGEMM) (const char *transa, const char *transb, int *m, int *n, int *k,
159 float *alpha, float *a, int *lda, float *b, int *ldb,
160 float *beta, float *c, int *ldc);
162 void
163 F77_FUNC(sgemv, SGEMV) (const char *trans, int *m, int *n, float *alpha, float *a, int *lda,
164 float *x, int *incx, float *beta, float *y, int *incy);
166 void
167 F77_FUNC(sger, SGER) (int *m, int *n, float *alpha, float *x, int *incx,
168 float *y, int *incy, float *a, int *lda);
170 float
171 F77_FUNC(snrm2, SNRM2) (int *n, float *x, int *incx);
173 void
174 F77_FUNC(srot, SROT) (int *n, float *dx, int *incx,
175 float *dy, int *incy, float *c, float *s);
177 void
178 F77_FUNC(sscal, SSCAL) (int *n, float *fact, float *dx, int *incx);
180 void
181 F77_FUNC(sswap, SSWAP) (int *n, float *dx, int *incx, float *dy, int *incy);
183 void
184 F77_FUNC(ssymv, SSYMV) (const char *uplo, int *n, float *alpha, float *a, int *lda,
185 float *x, int *incx, float *beta, float *y, int *incy);
187 void
188 F77_FUNC(ssyr2, SSYR2) (const char *uplo, int *n, float *alpha, float *x, int *incx,
189 float *y, int *incy, float *a, int *lda);
191 void
192 F77_FUNC(ssyr2k, SSYR2K) (const char *uplo, const char *trans, int *n, int *k, float *alpha, float *a,
193 int *lda, float *b, int *ldb, float *beta, float *c, int *ldc);
195 void
196 F77_FUNC(strmm, STRMM) (const char *side, const char *uplo, const char *transa, const char *diag, int *m, int *n,
197 float *alpha, float *a, int *lda, float *b, int *ldb);
199 void
200 F77_FUNC(strmv, STRMV) (const char *uplo, const char *trans, const char *diag, int *n,
201 float *a, int *lda, float *x, int *incx);
203 void
204 F77_FUNC(strsm, STRSM) (const char *side, const char *uplo, const char *transa, const char *diag, int *m, int *n,
205 float *alpha, float *a, int *lda, float *b, int *ldb);
208 F77_FUNC(isamax, ISAMAX) (int *n, float *dx, int *incx);
/* Close the extern "C" linkage block that the header opens before the
 * prototypes; only present when compiled as C++. */
#ifdef __cplusplus
}
#endif
215 /*! \endcond */
217 #endif /* GMX_BLAS_H */