src/gromacs/simd/simd.h

   1 /*
   2  * This file is part of the GROMACS molecular simulation package.
   3  *
   4  * Copyright (c) 2013,2014,2015, by the GROMACS development team, led by
   5  * Mark Abraham, David van der Spoel, Berk Hess, and Erik Lindahl,
   6  * and including many others, as listed in the AUTHORS file in the
   7  * top-level source directory and at http://www.gromacs.org.
   8  *
   9  * GROMACS is free software; you can redistribute it and/or
  10  * modify it under the terms of the GNU Lesser General Public License
  11  * as published by the Free Software Foundation; either version 2.1
  12  * of the License, or (at your option) any later version.
  13  *
  14  * GROMACS is distributed in the hope that it will be useful,
  15  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  16  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  17  * Lesser General Public License for more details.
  18  *
  19  * You should have received a copy of the GNU Lesser General Public
  20  * License along with GROMACS; if not, see
  21  * http://www.gnu.org/licenses, or write to the Free Software Foundation,
  22  * Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA.
  23  *
  24  * If you want to redistribute modifications to GROMACS, please
  25  * consider that scientific software is very special. Version
  26  * control is crucial - bugs must be traceable. We will be happy to
  27  * consider code for inclusion in the official distribution, but
  28  * derived work must not be called official GROMACS. Details are found
  29  * in the README & COPYING files - if they are missing, get the
  30  * official version at http://www.gromacs.org.
  31  *
  32  * To help us fund GROMACS development, we humbly ask that you cite
  33  * the research papers on the package. Check out http://www.gromacs.org.
  34  */
  35
  36 /*! \libinternal
  37  * \defgroup module_simd SIMD intrinsics interface (simd)
  38  * \ingroup group_utilitymodules
  39  *
  40  * \brief Provides an architecture-independent way of doing SIMD coding.
  41  *
  42  * Overview of the SIMD implementation is provided in \ref page_simd.
  43  * The details are documented in simd.h and the reference implementation
  44  * impl_reference.h.
  45  *
  46  * \author Erik Lindahl <erik.lindahl@scilifelab.se>
  47  */
  48
  49 #ifndef GMX_SIMD_SIMD_H
  50 #define GMX_SIMD_SIMD_H
  51
  52 /*! \libinternal \file
  53  *
  54  * \brief Definitions, capabilities, and wrappers for SIMD module.
  55  *
  56  * The macros in this file are intended to be used for writing
  57  * architecture-independent SIMD intrinsics code.
  58  * To support a new architecture, adding a new sub-include with macros here
  59  * should be (nearly) all that is needed.
  60  *
  61  * The defines in this top-level file will set default Gromacs real precision
  62  * operations to either single or double precision based on whether
  63  * GMX_DOUBLE is defined. The actual implementation - including e.g.
  64  * conversion operations specifically between single and double - is documented
  65  * in impl_reference.h.
  66  *
  67  * \author Erik Lindahl <erik.lindahl@scilifelab.se>
  68  *
  69  * \inlibraryapi
  70  * \ingroup module_simd
  71  */
  72
  73 #include "config.h"
  74
  75 #include <stddef.h>
  76
  77 #include "gromacs/utility/basedefinitions.h"
  78
  79 /* Forward declarations so memory allocation can be used in implementations */
  80 static gmx_inline float *  gmx_simd_align_f(float *p);
  81 static gmx_inline double * gmx_simd_align_d(double *p);
  82 static gmx_inline int *    gmx_simd_align_fi(int *p);
  83 static gmx_inline int *    gmx_simd_align_di(int *p);
  84 static gmx_inline float *  gmx_simd4_align_f(float *p);
  85 static gmx_inline double * gmx_simd4_align_d(double *p);
  86
  87 /*! \cond libapi */
  88 /*! \addtogroup module_simd */
  89 /*! \{ */
  90
  91 /*! \name SIMD predefined macros to describe high-level capabilities
  92  *
  93  *  These macros are used to describe the features available in default
  94  *  Gromacs real precision. They are set from the lower-level implementation
  95  *  files that have macros describing single and double precision individually,
  96  *  as well as the implementation details.
  97  *  \{
  98  */
  99
 100 /* Intel MIC is a bit special since it is a co-processor. This means the rest
 101  * of GROMACS (which runs on the CPU) can use a default SIMD set like AVX.
 102  * All functions in this SIMD module are static, so it will work perfectly fine
 103  * to include this file with different SIMD definitions for different files.
 104  */
 105 #if GMX_SIMD_X86_AVX_512ER
 106 #    include "impl_x86_avx_512er/impl_x86_avx_512er.h"
 107 #elif GMX_SIMD_X86_AVX_512F
 108 #    include "impl_x86_avx_512f/impl_x86_avx_512f.h"
 109 #elif GMX_SIMD_X86_MIC
 110 #    include "impl_intel_mic/impl_intel_mic.h"
 111 #elif GMX_SIMD_X86_AVX2_256
 112 #    include "impl_x86_avx2_256/impl_x86_avx2_256.h"
 113 #elif GMX_SIMD_X86_AVX_256
 114 #    include "impl_x86_avx_256/impl_x86_avx_256.h"
 115 #elif GMX_SIMD_X86_AVX_128_FMA
 116 #    include "impl_x86_avx_128_fma/impl_x86_avx_128_fma.h"
 117 #elif GMX_SIMD_X86_SSE4_1
 118 #    include "impl_x86_sse4_1/impl_x86_sse4_1.h"
 119 #elif GMX_SIMD_X86_SSE2
 120 #    include "impl_x86_sse2/impl_x86_sse2.h"
 121 #elif GMX_SIMD_ARM_NEON
 122 #    include "impl_arm_neon/impl_arm_neon.h"
 123 #elif GMX_SIMD_ARM_NEON_ASIMD
 124 #    include "impl_arm_neon_asimd/impl_arm_neon_asimd.h"
 125 #elif GMX_SIMD_IBM_QPX
 126 #    include "impl_ibm_qpx/impl_ibm_qpx.h"
 127 #elif GMX_SIMD_IBM_VMX
 128 #    include "impl_ibm_vmx/impl_ibm_vmx.h"
 129 #elif GMX_SIMD_IBM_VSX
 130 #    include "impl_ibm_vsx/impl_ibm_vsx.h"
 131 #elif GMX_SIMD_SPARC64_HPC_ACE
 132 #    include "impl_sparc64_hpc_ace/impl_sparc64_hpc_ace.h"
 133 #elif (GMX_SIMD_REFERENCE || defined DOXYGEN)
 134 /* Plain C SIMD reference implementation, also serves as documentation. */
 135 #    include "impl_reference/impl_reference.h"
 136 #else
 137 #    include "impl_none/impl_none.h"
 138 #endif
 139
 140 /* These convenience macros are ugly hacks where some source files still make
 141  * assumptions about the SIMD architecture. They will be removed as we implement
 142  * the new verlet kernels, but for now we need them, and to make sure they
 143  * always have values 0 or 1 we define them here rather than in the implementations.
 144  */
 145 #define GMX_SIMD_X86_AVX2_256_OR_HIGHER      (GMX_SIMD_X86_AVX2_256)
 146 #define GMX_SIMD_X86_AVX_256_OR_HIGHER       (GMX_SIMD_X86_AVX2_256_OR_HIGHER || GMX_SIMD_X86_AVX_256)
 147 #define GMX_SIMD_X86_AVX_128_FMA_OR_HIGHER   (GMX_SIMD_X86_AVX_128_FMA)
 148 #define GMX_SIMD_X86_SSE4_1_OR_HIGHER        (GMX_SIMD_X86_AVX_256_OR_HIGHER || GMX_SIMD_X86_AVX_128_FMA_OR_HIGHER || GMX_SIMD_X86_SSE4_1)
 149 #define GMX_SIMD_X86_SSE2_OR_HIGHER          (GMX_SIMD_X86_SSE4_1_OR_HIGHER || GMX_SIMD_X86_SSE2)
 150
 151 /*! \} */
 152
 153 /*! \name SIMD memory alignment operations
 154  *  \{
 155  */
 156
 157 /*! \brief
 158  * Align a float pointer for usage with SIMD instructions.
 159  *
 160  * You should typically \a not call this function directly (unless you explicitly
 161  * want single precision even when GMX_DOUBLE is set), but use the
 162  * \ref gmx_simd_align_r macro to align memory in default Gromacs real precision.
 163  *
 164  * \param  p Pointer to memory, allocate at least \ref GMX_SIMD_FLOAT_WIDTH extra elements.
 165  *
 166  * \return Aligned pointer (>=p) suitable for loading/storing float fp SIMD.
 167  *         If \ref GMX_SIMD_HAVE_FLOAT is not set, p will be returned unchanged.
 168  *
 169  * Start by allocating an extra \ref GMX_SIMD_FLOAT_WIDTH float elements of memory,
 170  * and then call this function. The returned pointer will be greater or equal
 171  * to the one you provided, and point to an address inside your provided memory
 172  * that is aligned to the SIMD width.
 173  */
 174 static gmx_inline float *
 175 gmx_simd_align_f(float *p)
 176 {
 177 #if GMX_SIMD_HAVE_FLOAT
 178     return (float *)(((size_t)((p)+GMX_SIMD_FLOAT_WIDTH-1)) & (~((size_t)(GMX_SIMD_FLOAT_WIDTH*sizeof(float)-1))));
 179 #else
 180     return p;
 181 #endif
 182 }
 183
 184 /*!  \brief
 185  * Align a double pointer for usage with SIMD instructions.
 186  *
 187  * You should typically \a not call this function directly (unless you explicitly
 188  * want double precision even when GMX_DOUBLE is not set), but use the
 189  * \ref gmx_simd_align_r macro to align memory in default Gromacs real precision.
 190  *
 191  * \param  p Pointer to memory, allocate at least \ref GMX_SIMD_DOUBLE_WIDTH extra elements.
 192  *
 193  * \return Aligned pointer (>=p) suitable for loading/storing double fp SIMD.
 194  *         If \ref GMX_SIMD_HAVE_DOUBLE is not set, p will be returned unchanged.
 195  *
 196  * Start by allocating an extra \ref GMX_SIMD_DOUBLE_WIDTH double elements of memory,
 197  * and then call this function. The returned pointer will be greater or equal
 198  * to the one you provided, and point to an address inside your provided memory
 199  * that is aligned to the SIMD width.
 200  */
 201 static gmx_inline double *
 202 gmx_simd_align_d(double *p)
 203 {
 204 #if GMX_SIMD_HAVE_DOUBLE
 205     return (double *)(((size_t)((p)+GMX_SIMD_DOUBLE_WIDTH-1)) & (~((size_t)(GMX_SIMD_DOUBLE_WIDTH*sizeof(double)-1))));
 206 #else
 207     return p;
 208 #endif
 209 }
 210
 211 /*! \brief
 212  * Align a (float) integer pointer for usage with SIMD instructions.
 213  *
 214  * You should typically \a not call this function directly (unless you explicitly
 215  * want integers corresponding to single precision even when GMX_DOUBLE is
 216  * set), but use the \ref gmx_simd_align_i macro to align integer memory
 217  * corresponding to Gromacs default floating-point precision.
 218  *
 219  * \param  p Pointer to memory, allocate at least \ref GMX_SIMD_FINT32_WIDTH extra elements.
 220  *
 221  * \return Aligned pointer (>=p) suitable for loading/storing float-integer SIMD.
 222  *         If \ref GMX_SIMD_HAVE_FINT32 is not set, p will be returned unchanged.
 223  *
 224  * This routine provides aligned memory for usage with \ref gmx_simd_fint32_t. You
 225  * should have allocated an extra \ref GMX_SIMD_FINT32_WIDTH * sizeof(int) bytes. The
 226  * reason why we need to separate float-integer vs. double-integer is that the
 227  * width of registers after conversions from the floating-point types might not
 228  * be identical, or even supported, in both cases.
 229  */
 230 static gmx_inline int *
 231 gmx_simd_align_fi(int *p)
 232 {
 233 #if GMX_SIMD_HAVE_FINT32
 234     return (int *)(((size_t)((p)+GMX_SIMD_FINT32_WIDTH-1)) & (~((size_t)(GMX_SIMD_FINT32_WIDTH*sizeof(int)-1))));
 235 #else
 236     return p;
 237 #endif
 238 }
 239
 240 /*! \brief
 241  * Align a (double) integer pointer for usage with SIMD instructions.
 242  *
 243  * You should typically \a not call this function directly (unless you explicitly
 244  * want integers corresponding to doublele precision even when GMX_DOUBLE is
 245  * not set), but use the \ref gmx_simd_align_i macro to align integer memory
 246  * corresponding to Gromacs default floating-point precision.
 247  *
 248  * \param  p Pointer to memory, allocate at least \ref GMX_SIMD_DINT32_WIDTH extra elements.
 249  *
 250  * \return Aligned pointer (>=p) suitable for loading/storing double-integer SIMD.
 251  *         If \ref GMX_SIMD_HAVE_DINT32 is not set, p will be returned unchanged.
 252  *
 253  * This routine provides aligned memory for usage with \ref gmx_simd_dint32_t. You
 254  * should have allocated an extra \ref GMX_SIMD_DINT32_WIDTH*sizeof(int) bytes. The
 255  * reason why we need to separate float-integer vs. double-integer is that the
 256  * width of registers after conversions from the floating-point types might not
 257  * be identical, or even supported, in both cases.
 258  */
 259 static gmx_inline int *
 260 gmx_simd_align_di(int *p)
 261 {
 262 #if GMX_SIMD_HAVE_DINT32
 263     return (int *)(((size_t)((p)+GMX_SIMD_DINT32_WIDTH-1)) & (~((size_t)(GMX_SIMD_DINT32_WIDTH*sizeof(int)-1))));
 264 #else
 265     return p;
 266 #endif
 267 }
 268
 269 /*! \brief
 270  * Align a float pointer for usage with SIMD4 instructions.
 271  *
 272  * You should typically \a not call this function directly (unless you explicitly
 273  * want single precision even when GMX_DOUBLE is set), but use the
 274  * \ref gmx_simd4_align_r macro to align memory in default Gromacs real precision.
 275  *
 276  * \param  p Pointer to memory, allocate at least \ref GMX_SIMD4_WIDTH extra elements.
 277  *
 278  * \return Aligned pointer (>=p) suitable for loading/storing float SIMD.
 279  *         If \ref GMX_SIMD4_HAVE_FLOAT is not set, p will be returned unchanged.
 280  *
 281  * This routine provides aligned memory for usage with \ref gmx_simd4_float_t.
 282  * should have allocated an extra \ref GMX_SIMD4_WIDTH * sizeof(float) bytes.
 283  */
 284 static gmx_inline float *
 285 gmx_simd4_align_f(float *p)
 286 {
 287 #if GMX_SIMD4_HAVE_FLOAT
 288     return (float *)(((size_t)((p)+GMX_SIMD4_WIDTH-1)) & (~((size_t)(GMX_SIMD4_WIDTH*sizeof(float)-1))));
 289 #else
 290     return p;
 291 #endif
 292 }
 293
 294 /*! \brief
 295  * Align a double pointer for usage with SIMD4 instructions.
 296  *
 297  * You should typically \a not call this function directly (unless you explicitly
 298  * want double precision even when GMX_DOUBLE is not set), but use the
 299  * \ref gmx_simd4_align_r macro to align memory in default Gromacs real precision.
 300  *
 301  * \param  p Pointer to memory, allocate at least \ref GMX_SIMD4_WIDTH extra elements.
 302  *
 303  * \return Aligned pointer (>=p) suitable for loading/storing float SIMD.
 304  *         If \ref GMX_SIMD4_HAVE_DOUBLE is not set, p will be returned unchanged.
 305  *
 306  * This routine provides aligned memory for usage with \ref gmx_simd4_double_t.
 307  * should have allocated an extra \ref GMX_SIMD4_WIDTH * sizeof(double) bytes.
 308  */
 309 static gmx_inline double *
 310 gmx_simd4_align_d(double *p)
 311 {
 312 #if GMX_SIMD4_HAVE_DOUBLE
 313     return (double *)(((size_t)((p)+GMX_SIMD4_WIDTH-1)) & (~((size_t)(GMX_SIMD4_WIDTH*sizeof(double)-1))));
 314 #else
 315     return p;
 316 #endif
 317 }
 318
 319 /*! \} */
 320
 321
 322 /* Define Gromacs "real" precision macros depending on Gromacs config. Note
 323  * that conversions float-to-double and v.v. are not included here since they
 324  * are not precision-dependent - find them in the implementation files.
 325  */
 326 #ifdef GMX_DOUBLE
 327 /* Double floating-point. The documentation is in the float part below */
 328 #    define gmx_simd_real_t                  gmx_simd_double_t
 329 #    define gmx_simd_load_r                  gmx_simd_load_d
 330 #    define gmx_simd_load1_r                 gmx_simd_load1_d
 331 #    define gmx_simd_set1_r                  gmx_simd_set1_d
 332 #    define gmx_simd_store_r                 gmx_simd_store_d
 333 #    define gmx_simd_loadu_r                 gmx_simd_loadu_d
 334 #    define gmx_simd_storeu_r                gmx_simd_storeu_d
 335 #    define gmx_simd_setzero_r               gmx_simd_setzero_d
 336 #    define gmx_simd_add_r                   gmx_simd_add_d
 337 #    define gmx_simd_sub_r                   gmx_simd_sub_d
 338 #    define gmx_simd_mul_r                   gmx_simd_mul_d
 339 #    define gmx_simd_fmadd_r                 gmx_simd_fmadd_d
 340 #    define gmx_simd_fmsub_r                 gmx_simd_fmsub_d
 341 #    define gmx_simd_fnmadd_r                gmx_simd_fnmadd_d
 342 #    define gmx_simd_fnmsub_r                gmx_simd_fnmsub_d
 343 #    define gmx_simd_and_r                   gmx_simd_and_d
 344 #    define gmx_simd_andnot_r                gmx_simd_andnot_d
 345 #    define gmx_simd_or_r                    gmx_simd_or_d
 346 #    define gmx_simd_xor_r                   gmx_simd_xor_d
 347 #    define gmx_simd_rsqrt_r                 gmx_simd_rsqrt_d
 348 #    define gmx_simd_rcp_r                   gmx_simd_rcp_d
 349 #    define gmx_simd_fabs_r                  gmx_simd_fabs_d
 350 #    define gmx_simd_fneg_r                  gmx_simd_fneg_d
 351 #    define gmx_simd_max_r                   gmx_simd_max_d
 352 #    define gmx_simd_min_r                   gmx_simd_min_d
 353 #    define gmx_simd_round_r                 gmx_simd_round_d
 354 #    define gmx_simd_trunc_r                 gmx_simd_trunc_d
 355 #    define gmx_simd_fraction_r              gmx_simd_fraction_d
 356 #    define gmx_simd_get_exponent_r          gmx_simd_get_exponent_d
 357 #    define gmx_simd_get_mantissa_r          gmx_simd_get_mantissa_d
 358 #    define gmx_simd_set_exponent_r          gmx_simd_set_exponent_d
 359 /* Double integer and conversions */
 360 #    define gmx_simd_int32_t                 gmx_simd_dint32_t
 361 #    define gmx_simd_load_i                  gmx_simd_load_di
 362 #    define gmx_simd_set1_i                  gmx_simd_set1_di
 363 #    define gmx_simd_store_i                 gmx_simd_store_di
 364 #    define gmx_simd_loadu_i                 gmx_simd_loadu_di
 365 #    define gmx_simd_storeu_i                gmx_simd_storeu_di
 366 #    define gmx_simd_setzero_i               gmx_simd_setzero_di
 367 #    define gmx_simd_cvt_r2i                 gmx_simd_cvt_d2i
 368 #    define gmx_simd_cvtt_r2i                gmx_simd_cvtt_d2i
 369 #    define gmx_simd_cvt_i2r                 gmx_simd_cvt_i2d
 370 #    define gmx_simd_extract_i               gmx_simd_extract_di
 371 #    define gmx_simd_slli_i                  gmx_simd_slli_di
 372 #    define gmx_simd_srli_i                  gmx_simd_srli_di
 373 #    define gmx_simd_and_i                   gmx_simd_and_di
 374 #    define gmx_simd_andnot_i                gmx_simd_andnot_di
 375 #    define gmx_simd_or_i                    gmx_simd_or_di
 376 #    define gmx_simd_xor_i                   gmx_simd_xor_di
 377 #    define gmx_simd_add_i                   gmx_simd_add_di
 378 #    define gmx_simd_sub_i                   gmx_simd_sub_di
 379 #    define gmx_simd_mul_i                   gmx_simd_mul_di
 380 /* Double booleans and selection */
 381 #    define gmx_simd_bool_t                  gmx_simd_dbool_t
 382 #    define gmx_simd_cmpeq_r                 gmx_simd_cmpeq_d
 383 #    define gmx_simd_cmplt_r                 gmx_simd_cmplt_d
 384 #    define gmx_simd_cmple_r                 gmx_simd_cmple_d
 385 #    define gmx_simd_and_b                   gmx_simd_and_db
 386 #    define gmx_simd_or_b                    gmx_simd_or_db
 387 #    define gmx_simd_anytrue_b               gmx_simd_anytrue_db
 388 #    define gmx_simd_blendzero_r             gmx_simd_blendzero_d
 389 #    define gmx_simd_blendnotzero_r          gmx_simd_blendnotzero_d
 390 #    define gmx_simd_blendv_r                gmx_simd_blendv_d
 391 #    define gmx_simd_reduce_r                gmx_simd_reduce_d
 392 #    define gmx_simd_ibool_t                 gmx_simd_dibool_t
 393 #    define gmx_simd_cmpeq_i                 gmx_simd_cmpeq_di
 394 #    define gmx_simd_cmplt_i                 gmx_simd_cmplt_di
 395 #    define gmx_simd_and_ib                  gmx_simd_and_dib
 396 #    define gmx_simd_or_ib                   gmx_simd_or_dib
 397 #    define gmx_simd_anytrue_ib              gmx_simd_anytrue_dib
 398 #    define gmx_simd_blendzero_i             gmx_simd_blendzero_di
 399 #    define gmx_simd_blendnotzero_i          gmx_simd_blendnotzero_di
 400 #    define gmx_simd_blendv_i                gmx_simd_blendv_di
 401 /* Conversions between integer and double floating-point booleans */
 402 #    define gmx_simd_cvt_b2ib                gmx_simd_cvt_db2dib
 403 #    define gmx_simd_cvt_ib2b                gmx_simd_cvt_dib2db
 404
 405 /* SIMD4 double fp - we only support a subset of SIMD instructions for SIMD4 */
 406 #    define gmx_simd4_real_t                 gmx_simd4_double_t
 407 #    define gmx_simd4_load_r                 gmx_simd4_load_d
 408 #    define gmx_simd4_load1_r                gmx_simd4_load1_d
 409 #    define gmx_simd4_set1_r                 gmx_simd4_set1_d
 410 #    define gmx_simd4_store_r                gmx_simd4_store_d
 411 #    define gmx_simd4_loadu_r                gmx_simd4_loadu_d
 412 #    define gmx_simd4_storeu_r               gmx_simd4_storeu_d
 413 #    define gmx_simd4_setzero_r              gmx_simd4_setzero_d
 414 #    define gmx_simd4_add_r                  gmx_simd4_add_d
 415 #    define gmx_simd4_sub_r                  gmx_simd4_sub_d
 416 #    define gmx_simd4_mul_r                  gmx_simd4_mul_d
 417 #    define gmx_simd4_fmadd_r                gmx_simd4_fmadd_d
 418 #    define gmx_simd4_fmsub_r                gmx_simd4_fmsub_d
 419 #    define gmx_simd4_fnmadd_r               gmx_simd4_fnmadd_d
 420 #    define gmx_simd4_fnmsub_r               gmx_simd4_fnmsub_d
 421 #    define gmx_simd4_and_r                  gmx_simd4_and_d
 422 #    define gmx_simd4_andnot_r               gmx_simd4_andnot_d
 423 #    define gmx_simd4_or_r                   gmx_simd4_or_d
 424 #    define gmx_simd4_xor_r                  gmx_simd4_xor_d
 425 #    define gmx_simd4_rsqrt_r                gmx_simd4_rsqrt_d
 426 #    define gmx_simd4_fabs_r                 gmx_simd4_fabs_d
 427 #    define gmx_simd4_fneg_r                 gmx_simd4_fneg_d
 428 #    define gmx_simd4_max_r                  gmx_simd4_max_d
 429 #    define gmx_simd4_min_r                  gmx_simd4_min_d
 430 #    define gmx_simd4_round_r                gmx_simd4_round_d
 431 #    define gmx_simd4_trunc_r                gmx_simd4_trunc_d
 432 #    define gmx_simd4_dotproduct3_r          gmx_simd4_dotproduct3_d
 433 #    define gmx_simd4_bool_t                 gmx_simd4_dbool_t
 434 #    define gmx_simd4_cmpeq_r                gmx_simd4_cmpeq_d
 435 #    define gmx_simd4_cmplt_r                gmx_simd4_cmplt_d
 436 #    define gmx_simd4_cmple_r                gmx_simd4_cmple_d
 437 #    define gmx_simd4_and_b                  gmx_simd4_and_db
 438 #    define gmx_simd4_or_b                   gmx_simd4_or_db
 439 #    define gmx_simd4_anytrue_b              gmx_simd4_anytrue_db
 440 #    define gmx_simd4_blendzero_r            gmx_simd4_blendzero_d
 441 #    define gmx_simd4_blendnotzero_r         gmx_simd4_blendnotzero_d
 442 #    define gmx_simd4_blendv_r               gmx_simd4_blendv_d
 443 #    define gmx_simd4_reduce_r               gmx_simd4_reduce_d
 444
 445 /* Memory allocation */
 446 #    define gmx_simd_align_r                 gmx_simd_align_d
 447 #    define gmx_simd_align_i                 gmx_simd_align_di
 448 #    define gmx_simd4_align_r                gmx_simd4_align_d
 449
 450 #    define GMX_SIMD_HAVE_REAL               GMX_SIMD_HAVE_DOUBLE
 451 #    define GMX_SIMD_REAL_WIDTH              GMX_SIMD_DOUBLE_WIDTH
 452 #    define GMX_SIMD_HAVE_INT32              GMX_SIMD_HAVE_DINT32
 453 #    define GMX_SIMD_INT32_WIDTH             GMX_SIMD_DINT32_WIDTH
 454 #    define GMX_SIMD_HAVE_INT32_EXTRACT      GMX_SIMD_HAVE_DINT32_EXTRACT
 455 #    define GMX_SIMD_HAVE_INT32_LOGICAL      GMX_SIMD_HAVE_DINT32_LOGICAL
 456 #    define GMX_SIMD_HAVE_INT32_ARITHMETICS  GMX_SIMD_HAVE_DINT32_ARITHMETICS
 457 #    define GMX_SIMD4_HAVE_REAL              GMX_SIMD4_HAVE_DOUBLE
 458
 459 #else /* GMX_DOUBLE */
 460
 461 /*! \name SIMD data types
 462  *
 463  *  The actual storage of these types is implementation dependent. The
 464  *  documentation is generated from the reference implementation, but for
 465  *  normal usage this will likely not be what you are using.
 466  * \{
 467  */
 468 /*! \brief Real precision floating-point SIMD datatype.
 469  *
 470  * This type is only available if \ref GMX_SIMD_HAVE_REAL is 1.
 471  *
 472  * If GMX_DOUBLE is defined, this will be set to \ref gmx_simd_double_t
 473  * internally, otherwise \ref gmx_simd_float_t.
 474  */
 475 #    define gmx_simd_real_t                  gmx_simd_float_t
 476
 477 /*! \brief 32-bit integer SIMD type.
 478  *
 479  * This type is only available if \ref GMX_SIMD_HAVE_INT32 is 1.
 480  *
 481  * If GMX_DOUBLE is defined, this will be set to \ref gmx_simd_dint32_t
 482  * internally, otherwise \ref gmx_simd_fint32_t. This might seem a strange
 483  * implementation detail, but it is because some SIMD implementations use
 484  * different types/widths of integers registers when converting from
 485  * double vs. single precision floating point. As long as you just use
 486  * this type you will not have to worry about precision.
 487  */
 488 #    define gmx_simd_int32_t                 gmx_simd_fint32_t
 489
 490 /*! \brief Boolean SIMD type for usage with \ref gmx_simd_real_t.
 491  *
 492  * This type is only available if \ref GMX_SIMD_HAVE_REAL is 1.
 493  *
 494  * If GMX_DOUBLE is defined, this will be set to \ref gmx_simd_dbool_t
 495  * internally, otherwise \ref gmx_simd_fbool_t. This is necessary since some
 496  * SIMD implementations use bitpatterns for marking truth, so single-
  497  * vs. double precision booleans are not necessarily exchangeable.
 498  * As long as you just use this type you will not have to worry about precision.
 499  *
 500  * See \ref gmx_simd_ibool_t for an explanation of real vs. integer booleans.
 501  */
 502 #    define gmx_simd_bool_t                  gmx_simd_fbool_t
 503
 504 /*! \brief Boolean SIMD type for usage with \ref gmx_simd_int32_t.
 505  *
 506  * This type is only available if \ref GMX_SIMD_HAVE_INT32 is 1.
 507  *
 508  * If GMX_DOUBLE is defined, this will be set to \ref gmx_simd_dibool_t
 509  * internally, otherwise \ref gmx_simd_fibool_t. This is necessary since some
 510  * SIMD implementations use bitpatterns for marking truth, so single-
  511  * vs. double precision booleans are not necessarily exchangeable, and while
 512  * a double-precision boolean might be represented with a 64-bit mask, the
 513  * corresponding integer might only use a 32-bit mask.
 514  *
 515  * We provide conversion routines for these cases, so the only thing you need to
 516  * keep in mind is to use \ref gmx_simd_bool_t when working with
 517  * \ref gmx_simd_real_t while you pick \ref gmx_simd_ibool_t when working with
 518  * \ref gmx_simd_int32_t.
 519  *
 520  * To convert between them, use \ref gmx_simd_cvt_b2ib and \ref gmx_simd_cvt_ib2b.
 521  */
 522 #    define gmx_simd_ibool_t                 gmx_simd_fibool_t
 523
 524
 525 /*! \}
 526  *  \name SIMD load/store operations on gmx_simd_real_t
 527  *
 528  *  \note Unaligned load/stores are only available when
 529  *  \ref GMX_SIMD_HAVE_LOADU and \ref GMX_SIMD_HAVE_STOREU are set, respectively.
 530  *  \{
 531  */
 532
 533 /*! \brief Load \ref GMX_SIMD_REAL_WIDTH values from aligned memory to \ref gmx_simd_real_t
 534  *
 535  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_load_d,
 536  * otherwise \ref gmx_simd_load_f.
 537  *
 538  * \copydetails gmx_simd_load_f
 539  */
 540 #    define gmx_simd_load_r                  gmx_simd_load_f
 541
 542 /*! \brief Set all elements in \ref gmx_simd_real_t from single value in memory.
 543  *
 544  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_load1_d,
 545  * otherwise \ref gmx_simd_load1_f.
 546  *
 547  * \copydetails gmx_simd_load1_f
 548  */
 549 #    define gmx_simd_load1_r                 gmx_simd_load1_f
 550
 551 /*! \brief Set all elements in \ref gmx_simd_real_t from a scalar.
 552  *
 553  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_set1_d,
 554  * otherwise \ref gmx_simd_set1_f.
 555  *
 556  * \copydetails gmx_simd_set1_f
 557  */
 558 #    define gmx_simd_set1_r                  gmx_simd_set1_f
 559
 560 /*! \brief Store \ref GMX_SIMD_REAL_WIDTH values from \ref gmx_simd_real_t to aligned memory.
 561  *
 562  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_store_d,
 563  * otherwise \ref gmx_simd_store_f.
 564  *
 565  * \copydetails gmx_simd_store_f
 566  */
 567 #    define gmx_simd_store_r                 gmx_simd_store_f
 568
 569 /*! \brief Load \ref GMX_SIMD_REAL_WIDTH values from unaligned memory to \ref gmx_simd_real_t.
 570  *
 571  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_loadu_d,
 572  * otherwise \ref gmx_simd_loadu_f.
 573  *
 574  * \copydetails gmx_simd_loadu_f
 575  */
 576 #    define gmx_simd_loadu_r                 gmx_simd_loadu_f
 577
 578 /*! \brief Store \ref GMX_SIMD_REAL_WIDTH values from \ref gmx_simd_real_t to unaligned memory.
 579  *
 580  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_storeu_d,
 581  * otherwise \ref gmx_simd_storeu_f.
 582  *
 583  * \copydetails gmx_simd_storeu_f
 584  */
 585 #    define gmx_simd_storeu_r                gmx_simd_storeu_f
 586
 587 /*! \brief Set all elements in \ref gmx_simd_real_t to 0.0.
 588  *
 589  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_setzero_d,
 590  * otherwise \ref gmx_simd_setzero_f.
 591  *
 592  * \copydetails gmx_simd_setzero_f
 593  */
 594 #    define gmx_simd_setzero_r               gmx_simd_setzero_f
 595
 596 /*! \}
 597  *  \name SIMD load/store operations on gmx_simd_int32_t
 598  *
 599  *  \note Unaligned load/stores are only available when
 600  *  \ref GMX_SIMD_HAVE_LOADU and \ref GMX_SIMD_HAVE_STOREU are set, respectively.
 601  *  \{
 602  */
 603
 604 /*! \brief Load \ref GMX_SIMD_INT32_WIDTH values from aligned memory to \ref gmx_simd_int32_t .
 605  *
 606  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_load_di ,
 607  * otherwise \ref gmx_simd_load_fi .
 608  *
 609  * \copydetails gmx_simd_load_fi
 610  */
 611 #    define gmx_simd_load_i                  gmx_simd_load_fi
 612
 613 /*! \brief Set all elements in \ref gmx_simd_int32_t from a single integer.
 614  *
 615  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_set1_di ,
 616  * otherwise \ref gmx_simd_set1_fi .
 617  *
 618  * \copydetails gmx_simd_set1_fi
 619  */
 620 #    define gmx_simd_set1_i                  gmx_simd_set1_fi
 621
  622 /*! \brief Store \ref GMX_SIMD_INT32_WIDTH values from \ref gmx_simd_int32_t to aligned memory.
 623  *
 624  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_store_di ,
 625  * otherwise \ref gmx_simd_store_fi .
 626  *
 627  * \copydetails gmx_simd_store_fi
 628  */
 629 #    define gmx_simd_store_i                 gmx_simd_store_fi
 630
  631 /*! \brief Load \ref GMX_SIMD_INT32_WIDTH values from unaligned memory to \ref gmx_simd_int32_t.
 632  *
 633  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_loadu_di ,
 634  * otherwise \ref gmx_simd_loadu_fi .
 635  *
 636  * \copydetails gmx_simd_loadu_fi
 637  */
 638 #    define gmx_simd_loadu_i                 gmx_simd_loadu_fi
 639
  640 /*! \brief Store \ref GMX_SIMD_INT32_WIDTH values from \ref gmx_simd_int32_t to unaligned memory.
 641  *
 642  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_storeu_di ,
 643  * otherwise \ref gmx_simd_storeu_fi .
 644  *
 645  * \copydetails gmx_simd_storeu_fi
 646  */
 647 #    define gmx_simd_storeu_i                gmx_simd_storeu_fi
 648
 649 /*! \brief Extract single integer from \ref gmx_simd_int32_t element.
 650  *
 651  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_extract_di ,
 652  * otherwise \ref gmx_simd_extract_fi .
 653  *
 654  * \copydetails gmx_simd_extract_fi
 655  */
 656 #    define gmx_simd_extract_i               gmx_simd_extract_fi
 657
 658 /*! \brief Set all elements in \ref gmx_simd_int32_t to 0.
 659  *
 660  * If GMX_DOUBLE is defined, it will be aliased to \ref gmx_simd_setzero_di ,
 661  * otherwise \ref gmx_simd_setzero_fi .
 662  *
 663  * \copydetails gmx_simd_setzero_fi
 664  */
 665 #    define gmx_simd_setzero_i               gmx_simd_setzero_fi
 666
 667
 668 /*! \}
 669  *  \name SIMD floating-point logical operations on gmx_simd_real_t
 670  *
 671  *  These instructions are available if \ref GMX_SIMD_HAVE_LOGICAL is 1.
 672  *  \{
 673  */
 674
 675 /*! \brief Bitwise \a and on two \ref gmx_simd_real_t.
 676  *
 677  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_and_d,
 678  * otherwise \ref gmx_simd_and_f.
 679  *
 680  * \copydetails gmx_simd_and_f
 681  */
 682 #    define gmx_simd_and_r                   gmx_simd_and_f
 683
 684 /*! \brief Bitwise \a and-not on two \ref gmx_simd_real_t; 1st arg is complemented.
 685  *
 686  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_andnot_d,
 687  * otherwise \ref gmx_simd_andnot_f.
 688  *
 689  * \copydetails gmx_simd_andnot_f
 690  */
 691 #    define gmx_simd_andnot_r                gmx_simd_andnot_f
 692
 693 /*! \brief Bitwise \a or on two \ref gmx_simd_real_t.
 694  *
 695  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_or_d,
 696  * otherwise \ref gmx_simd_or_f.
 697  *
 698  * \copydetails gmx_simd_or_f
 699  */
 700 #    define gmx_simd_or_r                    gmx_simd_or_f
 701
 702 /*! \brief Bitwise \a exclusive-or on two \ref gmx_simd_real_t.
 703  *
 704  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_xor_d,
 705  * otherwise \ref gmx_simd_xor_f.
 706  *
 707  * \copydetails gmx_simd_xor_f
 708  */
 709 #    define gmx_simd_xor_r                   gmx_simd_xor_f
 710
 711 /*! \}
 712  *  \name SIMD floating-point arithmetic operations on gmx_simd_real_t
 713  *  \{
 714  */
 715
 716 /*! \brief SIMD a+b for two \ref gmx_simd_real_t.
 717  *
 718  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_add_d,
 719  * otherwise \ref gmx_simd_add_f.
 720  *
 721  * \copydetails gmx_simd_add_f
 722  */
 723 #    define gmx_simd_add_r                   gmx_simd_add_f
 724
 725 /*! \brief SIMD a-b for two \ref gmx_simd_real_t.
 726  *
 727  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_sub_d,
 728  * otherwise \ref gmx_simd_sub_f.
 729  *
 730  * \copydetails gmx_simd_sub_f
 731  */
 732 #    define gmx_simd_sub_r                   gmx_simd_sub_f
 733
 734 /*! \brief SIMD a*b for two \ref gmx_simd_real_t.
 735  *
 736  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_mul_d,
 737  * otherwise \ref gmx_simd_mul_f.
 738  *
 739  * \copydetails gmx_simd_mul_f
 740  */
 741 #    define gmx_simd_mul_r                   gmx_simd_mul_f
 742
 743 /*! \brief SIMD a*b+c for three \ref gmx_simd_real_t.
 744  *
 745  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_fmadd_d,
 746  * otherwise \ref gmx_simd_fmadd_f.
 747  *
 748  * \copydetails gmx_simd_fmadd_f
 749  */
 750 #    define gmx_simd_fmadd_r                 gmx_simd_fmadd_f
 751
 752 /*! \brief SIMD a*b-c for three \ref gmx_simd_real_t.
 753  *
 754  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_fmsub_d,
 755  * otherwise \ref gmx_simd_fmsub_f.
 756  *
 757  * \copydetails gmx_simd_fmsub_f
 758  */
 759 #    define gmx_simd_fmsub_r                 gmx_simd_fmsub_f
 760
 761 /*! \brief SIMD -a*b+c for three \ref gmx_simd_real_t.
 762  *
 763  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_fnmadd_d,
 764  * otherwise \ref gmx_simd_fnmadd_f.
 765  *
 766  * \copydetails gmx_simd_fnmadd_f
 767  */
 768 #    define gmx_simd_fnmadd_r                gmx_simd_fnmadd_f
 769
 770 /*! \brief SIMD -a*b-c for three \ref gmx_simd_real_t.
 771  *
 772  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_fnmsub_d,
 773  * otherwise \ref gmx_simd_fnmsub_f.
 774  *
 775  * \copydetails gmx_simd_fnmsub_f
 776  */
 777 #    define gmx_simd_fnmsub_r                gmx_simd_fnmsub_f
 778
 779 /*! \brief SIMD table lookup for 1/sqrt(x) approximation.
 780  *
 781  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_rsqrt_d,
 782  * otherwise \ref gmx_simd_rsqrt_f.
 783  *
 784  * \copydetails gmx_simd_rsqrt_f
 785  */
 786 #    define gmx_simd_rsqrt_r                 gmx_simd_rsqrt_f
 787
 788 /*! \brief SIMD table lookup for 1/x approximation.
 789  *
 790  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_rcp_d,
 791  * otherwise \ref gmx_simd_rcp_f.
 792  *
 793  * \copydetails gmx_simd_rcp_f
 794  */
 795 #    define gmx_simd_rcp_r                   gmx_simd_rcp_f
 796
 797 /*! \brief SIMD fabs(x) for \ref gmx_simd_real_t.
 798  *
 799  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_fabs_d,
 800  * otherwise \ref gmx_simd_fabs_f.
 801  *
 802  * \copydetails gmx_simd_fabs_f
 803  */
 804 #    define gmx_simd_fabs_r                  gmx_simd_fabs_f
 805
 806 /*! \brief SIMD -x for \ref gmx_simd_real_t.
 807  *
 808  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_fneg_d,
 809  * otherwise \ref gmx_simd_fneg_f.
 810  *
 811  * \copydetails gmx_simd_fneg_f
 812  */
 813 #    define gmx_simd_fneg_r                  gmx_simd_fneg_f
 814
 815 /*! \brief SIMD max(a,b) for each element in \ref gmx_simd_real_t.
 816  *
 817  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_max_d,
 818  * otherwise \ref gmx_simd_max_f.
 819  *
 820  * \copydetails gmx_simd_max_f
 821  */
 822 #    define gmx_simd_max_r                   gmx_simd_max_f
 823
 824 /*! \brief SIMD min(a,b) for each element in \ref gmx_simd_real_t.
 825  *
 826  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_min_d,
 827  * otherwise \ref gmx_simd_min_f.
 828  *
 829  * \copydetails gmx_simd_min_f
 830  */
 831 #    define gmx_simd_min_r                   gmx_simd_min_f
 832
 833 /*! \brief Round \ref gmx_simd_real_t to nearest int, return \ref gmx_simd_real_t.
 834  *
 835  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_round_d,
 836  * otherwise \ref gmx_simd_round_f.
 837  *
 838  * \copydetails gmx_simd_round_f
 839  */
 840 #    define gmx_simd_round_r                 gmx_simd_round_f
 841
 842 /*! \brief Truncate \ref gmx_simd_real_t towards 0, return \ref gmx_simd_real_t.
 843  *
 844  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_trunc_d,
 845  * otherwise \ref gmx_simd_trunc_f.
 846  *
 847  * \copydetails gmx_simd_trunc_f
 848  */
 849 #    define gmx_simd_trunc_r                 gmx_simd_trunc_f
 850
 851 /*! \brief SIMD Fraction, i.e. x-trunc(x) for \ref gmx_simd_real_t.
 852  *
 853  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_fraction_d,
 854  * otherwise \ref gmx_simd_fraction_f.
 855  *
 856  * \copydetails gmx_simd_fraction_f
 857  */
 858 #    define gmx_simd_fraction_r              gmx_simd_fraction_f
 859
 860 /*! \brief Return the FP exponent of a SIMD \ref gmx_simd_real_t as a \ref gmx_simd_real_t.
 861  *
 862  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_get_exponent_d,
 863  * otherwise \ref gmx_simd_get_exponent_f.
 864  *
 865  * \copydetails gmx_simd_get_exponent_f
 866  */
 867 #    define gmx_simd_get_exponent_r          gmx_simd_get_exponent_f
 868
 869 /*! \brief Return the FP mantissa of a SIMD \ref gmx_simd_real_t as a \ref gmx_simd_real_t.
 870  *
 871  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_get_mantissa_d,
 872  * otherwise \ref gmx_simd_get_mantissa_f.
 873  *
 874  * \copydetails gmx_simd_get_mantissa_f
 875  */
 876 #    define gmx_simd_get_mantissa_r          gmx_simd_get_mantissa_f
 877
 878 /*! \brief Set the exponent of a SIMD \ref gmx_simd_real_t from a \ref gmx_simd_real_t.
 879  *
 880  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_set_exponent_d,
 881  * otherwise \ref gmx_simd_set_exponent_f.
 882  *
 883  * \copydetails gmx_simd_set_exponent_f
 884  */
 885 #    define gmx_simd_set_exponent_r          gmx_simd_set_exponent_f
 886
 887 /*! \}
 888  *  \name SIMD comparison, boolean, and select operations for gmx_simd_real_t
 889  *  \{
 890  */
 891
 892 /*! \brief SIMD a==b for \ref gmx_simd_real_t. Returns a \ref gmx_simd_bool_t.
 893  *
 894  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_cmpeq_d,
 895  * otherwise \ref gmx_simd_cmpeq_f.
 896  *
 897  * \copydetails gmx_simd_cmpeq_f
 898  */
 899 #    define gmx_simd_cmpeq_r                 gmx_simd_cmpeq_f
 900
 901 /*! \brief SIMD a<b for \ref gmx_simd_real_t. Returns a \ref gmx_simd_bool_t.
 902  *
 903  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_cmplt_d,
 904  * otherwise \ref gmx_simd_cmplt_f.
 905  *
 906  * \copydetails gmx_simd_cmplt_f
 907  */
 908 #    define gmx_simd_cmplt_r                 gmx_simd_cmplt_f
 909
 910 /*! \brief SIMD a<=b for \ref gmx_simd_real_t. Returns a \ref gmx_simd_bool_t.
 911  *
 912  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_cmple_d,
 913  * otherwise \ref gmx_simd_cmple_f.
 914  *
 915  * \copydetails gmx_simd_cmple_f
 916  */
 917 #    define gmx_simd_cmple_r                 gmx_simd_cmple_f
 918
 919 /*! \brief For each element, the result boolean is true if both arguments are true
 920  *
 921  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_and_db,
 922  * otherwise \ref gmx_simd_and_fb.
 923  *
 924  * \copydetails gmx_simd_and_fb
 925  */
 926 #    define gmx_simd_and_b                   gmx_simd_and_fb
 927
 928 /*! \brief For each element, the result boolean is true if either argument is true
 929  *
 930  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_or_db,
 931  * otherwise \ref gmx_simd_or_fb.
 932  *
 933  * \copydetails gmx_simd_or_fb
 934  */
 935 #    define gmx_simd_or_b                    gmx_simd_or_fb
 936
 937 /*! \brief Return nonzero if any element in gmx_simd_bool_t is true, otherwise 0.
 938  *
 939  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_anytrue_db,
 940  * otherwise \ref gmx_simd_anytrue_fb.
 941  *
 942  * \copydetails gmx_simd_anytrue_fb
 943  */
 944 #    define gmx_simd_anytrue_b               gmx_simd_anytrue_fb
 945
 946 /*! \brief Selects elements from \ref gmx_simd_real_t where boolean is true, otherwise 0.
 947  *
 948  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_blendzero_d,
 949  * otherwise \ref gmx_simd_blendzero_f.
 950  *
 951  * \copydetails gmx_simd_blendzero_f
 952  *
 953  * \sa gmx_simd_blendzero_i
 954  */
 955 #    define gmx_simd_blendzero_r             gmx_simd_blendzero_f
 956
 957 /*! \brief Selects elements from \ref gmx_simd_real_t where boolean is false, otherwise 0.
 958  *
 959  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_blendnotzero_d,
 960  * otherwise \ref gmx_simd_blendnotzero_f.
 961  *
 962  * \copydetails gmx_simd_blendnotzero_f
 963  */
 964 #    define gmx_simd_blendnotzero_r          gmx_simd_blendnotzero_f
 965
 966 /*! \brief Selects from 2nd real SIMD arg where boolean is true, otherwise 1st arg.
 967  *
 968  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_blendv_d,
 969  * otherwise \ref gmx_simd_blendv_f.
 970  *
 971  * \copydetails gmx_simd_blendv_f
 972  */
 973 #    define gmx_simd_blendv_r                gmx_simd_blendv_f
 974
 975 /*! \brief Return sum of all elements in SIMD floating-point variable.
 976  *
 977  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_reduce_d,
 978  * otherwise \ref gmx_simd_reduce_f.
 979  *
 980  * \copydetails gmx_simd_reduce_f
 981  */
 982 #    define gmx_simd_reduce_r                gmx_simd_reduce_f
 983
 984 /*! \}
 985  *  \name SIMD integer logical operations on gmx_simd_int32_t
 986  *
 987  *  These instructions are available if \ref GMX_SIMD_HAVE_INT32_LOGICAL is 1.
 988  *  \{
 989  */
 990
 991 /*! \brief Shift each element in \ref gmx_simd_int32_t left by immediate
 992  *
 993  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_slli_di,
 994  * otherwise \ref gmx_simd_slli_fi.
 995  *
 996  * \copydetails gmx_simd_slli_fi
 997  */
 998 #    define gmx_simd_slli_i                  gmx_simd_slli_fi
 999
1000 /*! \brief Shift each element in \ref gmx_simd_int32_t right by immediate
1001  *
1002  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_srli_di,
1003  * otherwise \ref gmx_simd_srli_fi.
1004  *
1005  * \copydetails gmx_simd_srli_fi
1006  */
1007 #    define gmx_simd_srli_i                  gmx_simd_srli_fi
1008
1009 /*! \brief Bitwise \a and on two \ref gmx_simd_int32_t.
1010  *
1011  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_and_di,
1012  * otherwise \ref gmx_simd_and_fi.
1013  *
1014  * \copydetails gmx_simd_and_fi
1015  */
1016 #    define gmx_simd_and_i                   gmx_simd_and_fi
1017
1018 /*! \brief Bitwise \a and-not on two \ref gmx_simd_int32_t; 1st arg is complemented.
1019  *
1020  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_andnot_di,
1021  * otherwise \ref gmx_simd_andnot_fi.
1022  *
1023  * \copydetails gmx_simd_andnot_fi
1024  */
1025 #    define gmx_simd_andnot_i                gmx_simd_andnot_fi
1026
1027 /*! \brief Bitwise \a or on two \ref gmx_simd_int32_t.
1028  *
1029  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_or_di,
1030  * otherwise \ref gmx_simd_or_fi.
1031  *
1032  * \copydetails gmx_simd_or_fi
1033  */
1034 #    define gmx_simd_or_i                    gmx_simd_or_fi
1035
1036 /*! \brief Bitwise \a xor on two \ref gmx_simd_int32_t.
1037  *
1038  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_xor_di,
1039  * otherwise \ref gmx_simd_xor_fi.
1040  *
1041  * \copydetails gmx_simd_xor_fi
1042  */
1043 #    define gmx_simd_xor_i                   gmx_simd_xor_fi
1044
1045 /*! \}
1046  *  \name SIMD integer arithmetic operations on gmx_simd_int32_t
1047  *
1048  *  These instructions are available if \ref GMX_SIMD_HAVE_INT32_ARITHMETICS is 1.
1049  *  \{
1050  */
1051
1052 /*! \brief SIMD a+b for two \ref gmx_simd_int32_t.
1053  *
1054  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_add_di,
1055  * otherwise \ref gmx_simd_add_fi.
1056  *
1057  * \copydetails gmx_simd_add_fi
1058  */
1059 #    define gmx_simd_add_i                   gmx_simd_add_fi
1060
1061 /*! \brief SIMD a-b for two \ref gmx_simd_int32_t.
1062  *
1063  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_sub_di,
1064  * otherwise \ref gmx_simd_sub_fi.
1065  *
1066  * \copydetails gmx_simd_sub_fi
1067  */
1068 #    define gmx_simd_sub_i                   gmx_simd_sub_fi
1069
1070 /*! \brief SIMD a*b for two \ref gmx_simd_int32_t.
1071  *
1072  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_mul_di,
1073  * otherwise \ref gmx_simd_mul_fi.
1074  *
1075  * \copydetails gmx_simd_mul_fi
1076  */
1077 #    define gmx_simd_mul_i                   gmx_simd_mul_fi
1078
1079 /*! \}
1080  *  \name SIMD integer comparison, booleans, and selection on gmx_simd_int32_t
1081  *
1082  *  These instructions are available if \ref GMX_SIMD_HAVE_INT32_ARITHMETICS is 1.
1083  *  \{
1084  */
1085
1086 /*! \brief Returns boolean describing whether a==b, for \ref gmx_simd_int32_t
1087  *
1088  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_cmpeq_di,
1089  * otherwise \ref gmx_simd_cmpeq_fi.
1090  *
1091  * \copydetails gmx_simd_cmpeq_fi
1092  */
1093 #    define gmx_simd_cmpeq_i                 gmx_simd_cmpeq_fi
1094
1095 /*! \brief Returns boolean describing whether a<b, for \ref gmx_simd_int32_t
1096  *
1097  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_cmplt_di,
1098  * otherwise \ref gmx_simd_cmplt_fi.
1099  *
1100  * \copydetails gmx_simd_cmplt_fi
1101  */
1102 #    define gmx_simd_cmplt_i                 gmx_simd_cmplt_fi
1103
1104 /*! \brief For each element, the result boolean is true if both arguments are true
1105  *
1106  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_and_dib,
1107  * otherwise \ref gmx_simd_and_fib.
1108  *
1109  * \copydetails gmx_simd_and_fib
1110  */
1111 #    define gmx_simd_and_ib                  gmx_simd_and_fib
1112
1113 /*! \brief For each element, the result boolean is true if either argument is true.
1114  *
1115  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_or_dib,
1116  * otherwise \ref gmx_simd_or_fib.
1117  *
1118  * \copydetails gmx_simd_or_fib
1119  */
1120 #    define gmx_simd_or_ib                   gmx_simd_or_fib
1121
1122 /*! \brief Return nonzero if any element in gmx_simd_ibool_t is true, otherwise 0.
1123  *
1124  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_anytrue_dib,
1125  * otherwise \ref gmx_simd_anytrue_fib.
1126  *
1127  * \copydetails gmx_simd_anytrue_fib
1128  */
1129 #    define gmx_simd_anytrue_ib              gmx_simd_anytrue_fib
1130
1131 /*! \brief Selects elements from \ref gmx_simd_int32_t where boolean is true, otherwise 0.
1132  *
1133  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_blendzero_di,
1134  * otherwise \ref gmx_simd_blendzero_fi.
1135  *
1136  * \copydetails gmx_simd_blendzero_fi
1137  */
1138 #    define gmx_simd_blendzero_i             gmx_simd_blendzero_fi
1139
1140 /*! \brief Selects elements from \ref gmx_simd_int32_t where boolean is false, otherwise 0.
1141  *
1142  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_blendnotzero_di,
1143  * otherwise \ref gmx_simd_blendnotzero_fi.
1144  *
1145  * \copydetails gmx_simd_blendnotzero_fi
1146  */
1147 #    define gmx_simd_blendnotzero_i          gmx_simd_blendnotzero_fi
1148
1149 /*! \brief Selects from 2nd int SIMD arg where boolean is true, otherwise 1st arg.
1150  *
1151  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_blendv_di,
1152  * otherwise \ref gmx_simd_blendv_fi.
1153  *
1154  * \copydetails gmx_simd_blendv_fi
1155  */
1156 #    define gmx_simd_blendv_i                gmx_simd_blendv_fi
1157
1158 /*! \}
1159  *  \name SIMD conversion operations
1160  *
1161  *  These instructions are available when both types involved in the conversion
1162  *  are defined, e.g. if \ref GMX_SIMD_HAVE_REAL and \ref GMX_SIMD_HAVE_INT32
1163  *  are 1 for real-to-integer conversion.
1164  *  \{
1165  */
1166
1167 /*! \brief Convert gmx_simd_real_t to gmx_simd_int32_t, round to nearest integer.
1168  *
1169  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_cvt_d2i,
1170  * otherwise \ref gmx_simd_cvt_f2i.
1171  *
1172  * \copydetails gmx_simd_cvt_f2i
1173  */
1174 #    define gmx_simd_cvt_r2i                 gmx_simd_cvt_f2i
1175
1176 /*! \brief Convert gmx_simd_real_t to gmx_simd_int32_t, truncate towards zero
1177  *
1178  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_cvtt_d2i,
1179  * otherwise \ref gmx_simd_cvtt_f2i.
1180  *
1181  * \copydetails gmx_simd_cvtt_f2i
1182  */
1183 #    define gmx_simd_cvtt_r2i                gmx_simd_cvtt_f2i
1184
1185 /*! \brief Convert gmx_simd_int32_t to gmx_simd_real_t
1186  *
1187  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_cvt_i2d,
1188  * otherwise \ref gmx_simd_cvt_i2f.
1189  *
1190  * \copydetails gmx_simd_cvt_i2f
1191  */
1192 #    define gmx_simd_cvt_i2r                 gmx_simd_cvt_i2f
1193
1194 /*! \brief Convert from gmx_simd_bool_t to gmx_simd_ibool_t
1195  *
1196  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_cvt_db2dib,
1197  * otherwise \ref gmx_simd_cvt_fb2fib.
1198  *
1199  * \copydetails gmx_simd_cvt_fb2fib
1200  */
1201 #    define gmx_simd_cvt_b2ib                gmx_simd_cvt_fb2fib
1202
1203 /*! \brief Convert from gmx_simd_ibool_t to gmx_simd_bool_t
1204  *
1205  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_cvt_dib2db,
1206  * otherwise \ref gmx_simd_cvt_fib2fb.
1207  *
1208  * \copydetails gmx_simd_cvt_fib2fb
1209  */
1210 #    define gmx_simd_cvt_ib2b                gmx_simd_cvt_fib2fb
1211
1212
1213 /*! \}
1214  *  \name SIMD memory alignment operations
1215  *  \{
1216  */
1217
1218 /*! \brief Align real memory for SIMD usage.
1219  *
1220  * This routine will only align memory if \ref GMX_SIMD_HAVE_REAL is 1.
1221  * Otherwise the original pointer will be returned.
1222  *
1223  * Start by allocating an extra \ref GMX_SIMD_REAL_WIDTH real elements of memory,
1224  * and then call this function. The returned pointer will be greater than or equal
1225  * to the one you provided, and point to an address inside your provided memory
1226  * that is aligned to the SIMD width.
1227  *
1228  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_align_d,
1229  * otherwise \ref gmx_simd_align_f. For detailed documentation, see the
1230  * precision-specific implementation routines.
1231  */
1232 #    define gmx_simd_align_r                 gmx_simd_align_f
1233
1234 /*! \brief Align integer memory for SIMD usage.
1235  *
1236  * This routine will only align memory if \ref GMX_SIMD_HAVE_INT32 is 1.
1237  * Otherwise the original pointer will be returned.
1238  *
1239  * Start by allocating an extra \ref GMX_SIMD_INT32_WIDTH elements of memory,
1240  * and then call this function. The returned pointer will be greater or equal
1241  * to the one you provided, and point to an address inside your provided memory
1242  * that is aligned to the SIMD width.
1243  *
1244  * If GMX_DOUBLE is defined, this will be aliased to \ref gmx_simd_align_di,
1245  * otherwise \ref gmx_simd_align_fi. For detailed documentation, see the
1246  * precision-specific implementation routines.
1247  */
1248 #    define gmx_simd_align_i                 gmx_simd_align_fi
1249
1250 /*! \} */
1251
1252 /*! \name SIMD4 - constant width-four SIMD datatypes
1253  *
1254  * These operations are only meant to be used for a few coordinate
1255  * manipulation and grid interpolation routines, so we only support a subset
1256  * of operations for SIMD4. To avoid repeating all the documentation from
1257  * the generic width SIMD routines, we only provide brief documentation for
1258  * these operations. Follow the link to the implementation documentation or the
1259  * reference to the corresponding generic SIMD routine. The format will be
1260  * exactly the same, but they have SIMD replaced with SIMD4.
1261  *  \{
1262  */
1263
1264 /*! \brief SIMD real datatype guaranteed to be 4 elements wide, if available.
1265  *
1266  * All the SIMD4 datatypes and operations behave like their counterparts for
1267  * the generic SIMD implementation, but they might be implemented with different
1268  * registers, or not supported at all. It is important that you check the
1269  * define \ref GMX_SIMD4_HAVE_REAL before using it.
1270  *
1271  * Just as the normal SIMD operations, all SIMD4 types and routines will
1272  * be aliased to either single or double precision ones based on whether
1273  * GMX_DOUBLE is defined.
1274  *
1275  * \note There is no support for integer or math operations in SIMD4.
1276  */
1277 #    define gmx_simd4_real_t                 gmx_simd4_float_t
1278
1279 /*! \brief Boolean for \ref gmx_simd4_real_t comparison/selection */
1280 #    define gmx_simd4_bool_t                 gmx_simd4_fbool_t
1281
1282 /*! \brief Load aligned data to gmx_simd4_real_t.
1283  *
1284  * \copydetails gmx_simd4_load_f
1285  */
1286 #    define gmx_simd4_load_r                 gmx_simd4_load_f
1287
1288 /*! \brief Load single element to gmx_simd4_real_t
1289  *
1290  * \copydetails gmx_simd4_load1_f
1291  */
1292 #    define gmx_simd4_load1_r                gmx_simd4_load1_f
1293
1294 /*! \brief Set gmx_simd4_real_t from scalar value
1295  *
1296  * \copydetails gmx_simd4_set1_f
1297  */
1298 #    define gmx_simd4_set1_r                 gmx_simd4_set1_f
1299
1300 /*! \brief Store aligned data from gmx_simd4_real_t
1301  *
1302  * \copydetails gmx_simd4_store_f
1303  */
1304 #    define gmx_simd4_store_r                gmx_simd4_store_f
1305
1306 /*! \brief Load unaligned data to gmx_simd4_real_t
1307  *
1308  * \copydetails gmx_simd4_loadu_f
1309  */
1310 #    define gmx_simd4_loadu_r                gmx_simd4_loadu_f
1311
1312 /*! \brief Store unaligned data from gmx_simd4_real_t
1313  *
1314  * \copydetails gmx_simd4_storeu_f
1315  */
1316 #    define gmx_simd4_storeu_r               gmx_simd4_storeu_f
1317
1318 /*! \brief Set all elements in gmx_simd4_real_t to 0.0
1319  *
1320  * \copydetails gmx_simd4_setzero_f
1321  */
1322 #    define gmx_simd4_setzero_r              gmx_simd4_setzero_f
1323
1324 /*! \brief Bitwise and for two gmx_simd4_real_t
1325  *
1326  * \copydetails gmx_simd4_and_f
1327  */
1328 #    define gmx_simd4_and_r                  gmx_simd4_and_f
1329
1330 /*! \brief Bitwise and-not for two gmx_simd4_real_t. 1st arg is complemented.
1331  *
1332  * \copydetails gmx_simd4_andnot_f
1333  */
1334 #    define gmx_simd4_andnot_r               gmx_simd4_andnot_f
1335
1336 /*! \brief Bitwise or for two gmx_simd4_real_t
1337  *
1338  * \copydetails gmx_simd4_or_f
1339  */
1340 #    define gmx_simd4_or_r                   gmx_simd4_or_f
1341
1342 /*! \brief Bitwise xor for two gmx_simd4_real_t
1343  *
1344  * \copydetails gmx_simd4_xor_f
1345  */
1346 #    define gmx_simd4_xor_r                  gmx_simd4_xor_f
1347
1348 /*! \brief a+b for \ref gmx_simd4_real_t
1349  *
1350  * \copydetails gmx_simd4_add_f
1351  */
1352 #    define gmx_simd4_add_r                  gmx_simd4_add_f
1353
1354 /*! \brief a-b for \ref gmx_simd4_real_t
1355  *
1356  * \copydetails gmx_simd4_sub_f
1357  */
1358 #    define gmx_simd4_sub_r                  gmx_simd4_sub_f
1359
1360 /*! \brief a*b for \ref gmx_simd4_real_t
1361  *
1362  * \copydetails gmx_simd4_mul_f
1363  */
1364 #    define gmx_simd4_mul_r                  gmx_simd4_mul_f
1365
1366 /*! \brief a*b+c for \ref gmx_simd4_real_t
1367  *
1368  * \copydetails gmx_simd4_fmadd_f
1369  */
1370 #    define gmx_simd4_fmadd_r                gmx_simd4_fmadd_f
1371
1372 /*! \brief a*b-c for \ref gmx_simd4_real_t
1373  *
1374  * \copydetails gmx_simd4_fmsub_f
1375  */
1376 #    define gmx_simd4_fmsub_r                gmx_simd4_fmsub_f
1377
1378 /*! \brief -a*b+c for \ref gmx_simd4_real_t
1379  *
1380  * \copydetails gmx_simd4_fnmadd_f
1381  */
1382 #    define gmx_simd4_fnmadd_r               gmx_simd4_fnmadd_f
1383
1384 /*! \brief -a*b-c for \ref gmx_simd4_real_t
1385  *
1386  * \copydetails gmx_simd4_fnmsub_f
1387  */
1388 #    define gmx_simd4_fnmsub_r               gmx_simd4_fnmsub_f
1389
1390 /*! \brief 1/sqrt(x) approximate lookup for \ref gmx_simd4_real_t
1391  *
1392  * \copydetails gmx_simd4_rsqrt_f
1393  */
1394 #    define gmx_simd4_rsqrt_r                gmx_simd4_rsqrt_f
1395
1396 /*! \brief fabs(x) for \ref gmx_simd4_real_t
1397  *
1398  * \copydetails gmx_simd4_fabs_f
1399  */
1400 #    define gmx_simd4_fabs_r                 gmx_simd4_fabs_f
1401
1402 /*! \brief Change sign (-x) for \ref gmx_simd4_real_t
1403  *
1404  * \copydetails gmx_simd4_fneg_f
1405  */
1406 #    define gmx_simd4_fneg_r                 gmx_simd4_fneg_f
1407
1408 /*! \brief Select maximum of each pair of elements from args for \ref gmx_simd4_real_t
1409  *
1410  * \copydetails gmx_simd4_max_f
1411  */
1412 #    define gmx_simd4_max_r                  gmx_simd4_max_f
1413
1414 /*! \brief Select minimum of each pair of elements from args for \ref gmx_simd4_real_t
1415  *
1416  * \copydetails gmx_simd4_min_f
1417  */
1418 #    define gmx_simd4_min_r                  gmx_simd4_min_f
1419
1420 /*! \brief Round \ref gmx_simd4_real_t to nearest integer, return \ref gmx_simd4_real_t
1421  *
1422  * \copydetails gmx_simd4_round_f
1423  */
1424 #    define gmx_simd4_round_r                gmx_simd4_round_f
1425
1426 /*! \brief Truncate \ref gmx_simd4_real_t towards zero, return \ref gmx_simd4_real_t
1427  *
1428  * \copydetails gmx_simd4_trunc_f
1429  */
1430 #    define gmx_simd4_trunc_r                gmx_simd4_trunc_f
1431
1432 /*! \brief Scalar product of first three elements of two \ref gmx_simd4_real_t
1433  *
1434  * \copydetails gmx_simd4_dotproduct3_f
1435  */
1436 #    define gmx_simd4_dotproduct3_r          gmx_simd4_dotproduct3_f
1437
1438 /*! \brief Return booleans whether a==b for each element of two \ref gmx_simd4_real_t
1439  *
1440  * \copydetails gmx_simd4_cmpeq_f
1441  */
1442 #    define gmx_simd4_cmpeq_r                gmx_simd4_cmpeq_f
1443 /*! \brief Return booleans whether a<b for each element of two \ref gmx_simd4_real_t
1444  *
1445  * \copydetails gmx_simd4_cmplt_f
1446  */
1447 #    define gmx_simd4_cmplt_r                gmx_simd4_cmplt_f
1448 /*! \brief Return booleans whether a<=b for each element of two \ref gmx_simd4_real_t
1449  *
1450  * \copydetails gmx_simd4_cmple_f
1451  */
1452 #    define gmx_simd4_cmple_r                gmx_simd4_cmple_f
1453
1454 /*! \brief Logical and for two \ref gmx_simd4_bool_t
1455  *
1456  * \copydetails gmx_simd4_and_fb
1457  */
1458 #    define gmx_simd4_and_b                  gmx_simd4_and_fb
1459 /*! \brief Logical or for two \ref gmx_simd4_bool_t
1460  *
1461  * \copydetails gmx_simd4_or_fb
1462  */
1463 #    define gmx_simd4_or_b                   gmx_simd4_or_fb
1464
1465 /*! \brief Return nonzero if any element in \ref gmx_simd4_bool_t is true, otherwise 0
1466  *
1467  * \copydetails gmx_simd4_anytrue_fb
1468  */
1469 #    define gmx_simd4_anytrue_b              gmx_simd4_anytrue_fb
1470
1471 /*! \brief Selects elements from \ref gmx_simd4_real_t where boolean is true, otherwise 0.
1472  *
1473  * \copydetails gmx_simd4_blendzero_f
1474  */
1475 #    define gmx_simd4_blendzero_r            gmx_simd4_blendzero_f
1476
1477 /*! \brief Selects elements from \ref gmx_simd4_real_t where boolean is false, otherwise 0.
1478  *
1479  * \copydetails gmx_simd4_blendnotzero_f
1480  */
1481 #    define gmx_simd4_blendnotzero_r            gmx_simd4_blendnotzero_f
1482
1483 /*! \brief Selects from 2nd real SIMD4 arg where boolean is true, otherwise 1st arg
1484  *
1485  * \copydetails gmx_simd4_blendv_f
1486  */
1487 #    define gmx_simd4_blendv_r               gmx_simd4_blendv_f
1488
1489 /*! \brief Return sum of all elements in SIMD4 floating-point variable.
1490  *
1491  * \copydetails gmx_simd4_reduce_f
1492  */
1493 #    define gmx_simd4_reduce_r               gmx_simd4_reduce_f
1494
1495 /*! \brief Align real memory for SIMD4 usage.
1496  *
1497  * \copydetails gmx_simd4_align_f
1498  */
1499 #    define gmx_simd4_align_r                gmx_simd4_align_f
1500
1501 /*! \} */
1502
1503 /*! \name SIMD predefined macros to describe high-level capabilities
1504  *  \{
1505  */
1506
1507 /*! \brief 1 if gmx_simd_real_t is available, otherwise 0.
1508  *
1509  *  If GMX_DOUBLE is defined, this will be aliased to
1510  *  \ref GMX_SIMD_HAVE_DOUBLE, otherwise GMX_SIMD_HAVE_FLOAT.
1511  */
1512 #    define GMX_SIMD_HAVE_REAL               GMX_SIMD_HAVE_FLOAT
1513
1514 /*! \brief Width of gmx_simd_real_t.
1515  *
1516  *  If GMX_DOUBLE is defined, this will be aliased to
1517  *  \ref GMX_SIMD_DOUBLE_WIDTH, otherwise GMX_SIMD_FLOAT_WIDTH.
1518  */
1519 #    define GMX_SIMD_REAL_WIDTH              GMX_SIMD_FLOAT_WIDTH
1520
1521 /*! \brief 1 if gmx_simd_int32_t is available, otherwise 0.
1522  *
1523  *  If GMX_DOUBLE is defined, this will be aliased to
1524  *  \ref GMX_SIMD_HAVE_DINT32, otherwise GMX_SIMD_HAVE_FINT32.
1525  */
1526 #    define GMX_SIMD_HAVE_INT32              GMX_SIMD_HAVE_FINT32
1527
1528 /*! \brief Width of gmx_simd_int32_t.
1529  *
1530  *  If GMX_DOUBLE is defined, this will be aliased to
1531  *  \ref GMX_SIMD_DINT32_WIDTH, otherwise GMX_SIMD_FINT32_WIDTH.
1532  */
1533 #    define GMX_SIMD_INT32_WIDTH             GMX_SIMD_FINT32_WIDTH
1534
1535 /*! \brief 1 if gmx_simd_extract_i() is available, otherwise 0.
1536  *
1537  *  If GMX_DOUBLE is defined, this will correspond to
1538  *  \ref GMX_SIMD_HAVE_DINT32_EXTRACT, otherwise GMX_SIMD_HAVE_FINT32_EXTRACT.
1539  */
1540 #    define GMX_SIMD_HAVE_INT32_EXTRACT      GMX_SIMD_HAVE_FINT32_EXTRACT
1541
1542 /*! \brief 1 if logical ops are supported on gmx_simd_int32_t, otherwise 0.
1543  *
1544  *  If GMX_DOUBLE is defined, this will correspond to
1545  *  \ref GMX_SIMD_HAVE_DINT32_LOGICAL, otherwise GMX_SIMD_HAVE_FINT32_LOGICAL.
1546  */
1547 #    define GMX_SIMD_HAVE_INT32_LOGICAL      GMX_SIMD_HAVE_FINT32_LOGICAL
1548
1549 /*! \brief 1 if arithmetic ops are supported on gmx_simd_int32_t, otherwise 0.
1550  *
1551  *  If GMX_DOUBLE is defined, this will be aliased to
1552  *  \ref GMX_SIMD_HAVE_DINT32_ARITHMETICS, otherwise GMX_SIMD_HAVE_FINT32_ARITHMETICS.
1553  */
1554 #    define GMX_SIMD_HAVE_INT32_ARITHMETICS  GMX_SIMD_HAVE_FINT32_ARITHMETICS
1555
1556 /*! \brief 1 if gmx_simd4_real_t is available, otherwise 0.
1557  *
1558  *  If GMX_DOUBLE is defined, this will be aliased to
1559  *  \ref GMX_SIMD4_HAVE_DOUBLE, otherwise GMX_SIMD4_HAVE_FLOAT.
1560  */
1561 #    define GMX_SIMD4_HAVE_REAL              GMX_SIMD4_HAVE_FLOAT
1562
1563
1564 /*! \} */
1565
1566 #endif /* GMX_DOUBLE */
1567
1568 /*! \} */
1569 /*! \endcond */
1570
1571 #if 0
1572 /* Finally, a hack to cover a possible corner case of using an
1573    explicit GMX_SIMD_HAVE_FLOAT or GMX_SIMD_HAVE_DOUBLE, rather than
1574    GMX_SIMD_HAVE_REAL.
1575
1576    Such code is expected to include simd.h to get those symbols
1577    defined, but the actual definitions are in the implementation headers
1578    included by simd.h. check-source.py is not a full preprocessor, so
1579    it does not see the definitions in the implementation headers as
1580    belonging to simd.h, thus it cannot check that simd.h is being used
1581    correctly in the above hypothetical corner case. However, the
1582    checker also does not parse #if 0, so we can fool the checker into
1583    thinking that definition occurs here, and that will work well
1584    enough.
1585
1586    If there are ever other kinds of SIMD code that might have the same
1587    problem, we might want to add other variables here.
1588  */
1589 #    define GMX_SIMD_HAVE_FLOAT         1
1590 #    define GMX_SIMD_HAVE_DOUBLE        1
1591
1592 #endif /* 0 */
1593
1594 #endif /* GMX_SIMD_SIMD_H */