1 /* -*- mode: c; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4; c-file-style: "stroustrup"; -*-
4 * This source code is part of
8 * GROningen MAchine for Chemical Simulations
10 * Written by David van der Spoel, Erik Lindahl, Berk Hess, and others.
11 * Copyright (c) 1991-2000, University of Groningen, The Netherlands.
12 * Copyright (c) 2001-2012, The GROMACS development team,
13 * check out http://www.gromacs.org for more information.
15 * This program is free software; you can redistribute it and/or
16 * modify it under the terms of the GNU General Public License
17 * as published by the Free Software Foundation; either version 2
18 * of the License, or (at your option) any later version.
20 * If you want to redistribute modifications, please consider that
21 * scientific software is very special. Version control is crucial -
22 * bugs must be traceable. We will be happy to consider code for
23 * inclusion in the official distribution, but derived work must not
24 * be called official GROMACS. Details are found in the README & COPYING
25 * files - if they are missing, get the official version at www.gromacs.org.
27 * To help us fund GROMACS development, we humbly ask that you cite
28 * the papers on the package - you can find them in the top README file.
30 * For more info, check our website at http://www.gromacs.org
 * Gallium Rubidium Oxygen Manganese Argon Carbon Silicon
 */
36 #ifndef NBNXN_CUDA_TYPES_EXT_H
37 #define NBNXN_CUDA_TYPES_EXT_H
/* CUDA nonbonded structure.
 *
 * Handle type: a pointer to struct nbnxn_cuda. Only the struct tag is
 * introduced by this declaration; the struct's members are not given in
 * this part of the header, so code that sees only this typedef can pass
 * the handle around but cannot dereference it.
 */
typedef struct nbnxn_cuda *nbnxn_cuda_ptr_t;
/* CUDA GPU device info.
 *
 * Handle type: a pointer to struct cuda_dev_info. Only the struct tag is
 * introduced by this declaration; the struct's members are not given in
 * this part of the header, so code that sees only this typedef can pass
 * the handle around but cannot dereference it.
 */
typedef struct cuda_dev_info *cuda_dev_info_ptr_t;
/* Types defined for the structs below.
 *
 * Each typedef gives a struct tag a "_t" alias so the struct can be named
 * without the "struct" keyword (e.g. for members of type
 * nbnxn_cuda_ktime_t). The aliases are declared ahead of the struct
 * definitions so they can already be used inside them.
 */
typedef struct wallclock_gpu    wallclock_gpu_t;
typedef struct nbnxn_cuda_ktime nbnxn_cuda_ktime_t;
53 /* Nonbonded kernel time and call count. */
54 struct nbnxn_cuda_ktime
/* GPU timings for kernels and H2D/D2H transfers. */
63 nbnxn_cuda_ktime_t ktime
[2][2]; /* table containing the timings of the four
   versions of the nonbonded kernels: force-only,
   force+energy, force+pruning, and force+energy+pruning */
66 double nb_h2d_t
; /* host to device transfer time in nb calculation */
67 double nb_d2h_t
; /* device to host transfer time in nb calculation */
68 int nb_c
; /* total call count of the nonbonded gpu operations */
69 double pl_h2d_t
; /* pair search step host to device transfer time */
70 int pl_h2d_c
; /* pair search step host to device transfer call count */
77 #endif /* NBNXN_CUDA_TYPES_EXT_H */