/*
 * This file is part of the GROMACS molecular simulation package.
 *
 * Copyright (c) 1991-2000, University of Groningen, The Netherlands.
 * Copyright (c) 2001-2004, The GROMACS development team.
 * Copyright (c) 2013,2014,2015,2016,2017,2018,2019, by the GROMACS development team, led by
 * Mark Abraham, David van der Spoel, Berk Hess, and Erik Lindahl,
 * and including many others, as listed in the AUTHORS file in the
 * top-level source directory and at http://www.gromacs.org.
 *
 * GROMACS is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public License
 * as published by the Free Software Foundation; either version 2.1
 * of the License, or (at your option) any later version.
 *
 * GROMACS is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with GROMACS; if not, see
 * http://www.gnu.org/licenses, or write to the Free Software Foundation,
 * Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA.
 *
 * If you want to redistribute modifications to GROMACS, please
 * consider that scientific software is very special. Version
 * control is crucial - bugs must be traceable. We will be happy to
 * consider code for inclusion in the official distribution, but
 * derived work must not be called official GROMACS. Details are found
 * in the README & COPYING files - if they are missing, get the
 * official version at http://www.gromacs.org.
 *
 * To help us fund GROMACS development, we humbly ask that you cite
 * the research papers on the package. Check out http://www.gromacs.org.
 */
#include "gromacs/domdec/dlbtiming.h"
#include "gromacs/domdec/domdec.h"
#include "gromacs/domdec/domdec_struct.h"
#include "gromacs/ewald/ewald.h"
#include "gromacs/ewald/long_range_correction.h"
#include "gromacs/ewald/pme.h"
#include "gromacs/gmxlib/network.h"
#include "gromacs/gmxlib/nrnb.h"
#include "gromacs/listed_forces/listed_forces.h"
#include "gromacs/math/vec.h"
#include "gromacs/math/vecdump.h"
#include "gromacs/mdlib/force_flags.h"
#include "gromacs/mdlib/forcerec_threading.h"
#include "gromacs/mdlib/qmmm.h"
#include "gromacs/mdlib/rf_util.h"
#include "gromacs/mdlib/wall.h"
#include "gromacs/mdtypes/commrec.h"
#include "gromacs/mdtypes/enerdata.h"
#include "gromacs/mdtypes/forceoutput.h"
#include "gromacs/mdtypes/forcerec.h"
#include "gromacs/mdtypes/inputrec.h"
#include "gromacs/mdtypes/md_enums.h"
#include "gromacs/mdtypes/mdatom.h"
#include "gromacs/pbcutil/ishift.h"
#include "gromacs/pbcutil/mshift.h"
#include "gromacs/pbcutil/pbc.h"
#include "gromacs/timing/wallcycle.h"
#include "gromacs/utility/exceptions.h"
#include "gromacs/utility/fatalerror.h"
#include "gromacs/utility/smalloc.h"
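
/*! \brief Zero the energy, dV/dlambda and virial accumulators of a
 * thread-local Ewald correction output struct. */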
static void clearEwaldThreadOutput(ewald_corr_thread_t *ewc_t)
{
    ewc_t->Vcorr_q        = 0;
    ewc_t->Vcorr_lj       = 0;
    ewc_t->dvdl[efptCOUL] = 0;
    ewc_t->dvdl[efptVDW]  = 0;
    clear_mat(ewc_t->vir_q);
    clear_mat(ewc_t->vir_lj);
}
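
/*! \brief Accumulate the per-thread Ewald correction outputs
 * ewc_t[1..nthreads-1] into ewc_t[0]. */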
static void reduceEwaldThreadOuput(int nthreads, ewald_corr_thread_t *ewc_t)
{
    ewald_corr_thread_t &dest = ewc_t[0];

    for (int t = 1; t < nthreads; t++)
    {
        dest.Vcorr_q        += ewc_t[t].Vcorr_q;
        dest.Vcorr_lj       += ewc_t[t].Vcorr_lj;
        dest.dvdl[efptCOUL] += ewc_t[t].dvdl[efptCOUL];
        dest.dvdl[efptVDW]  += ewc_t[t].dvdl[efptVDW];
        m_add(dest.vir_q,  ewc_t[t].vir_q,  dest.vir_q);
        m_add(dest.vir_lj, ewc_t[t].vir_lj, dest.vir_lj);
    }
}
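
/*! \brief Compute the lower-level, CPU-side force contributions: walls,
 * listed (bonded) interactions, and the long-range part of Ewald/PME
 * electrostatics and LJ-PME, accumulating forces, energies, virials and
 * dV/dlambda into \p forceOutputs and \p enerd. */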
void do_force_lowlevel(t_forcerec                          *fr,
                       const t_inputrec                    *ir,
                       const t_idef                        *idef,
                       const t_commrec                     *cr,
                       const gmx_multisim_t                *ms,
                       t_nrnb                              *nrnb,
                       gmx_wallcycle_t                      wcycle,
                       const t_mdatoms                     *md,
                       gmx::ArrayRefWithPadding<gmx::RVec>  coordinates,
                       history_t                           *hist,
                       gmx::ForceOutputs                   *forceOutputs,
                       gmx_enerdata_t                      *enerd,
                       t_fcdata                            *fcd,
                       const matrix                         box,
                       const real                          *lambda,
                       const t_graph                       *graph,
                       const rvec                          *mu_tot,
                       int                                  flags,
                       const DDBalanceRegionHandler        &ddBalanceRegionHandler)
{
    // TODO: Replace all uses of x by const coordinates
    rvec *x = as_rvec_array(coordinates.paddedArrayRef().data());

    // TODO: Add the shift forces to forceOutputs
    rvec *forceForUseWithShiftForces = forceOutputs->f();
    auto &forceWithVirial            = forceOutputs->forceWithVirial();
    /* do QMMM first if requested */
    if (fr->bQMMM)
    {
        enerd->term[F_EQM] = calculate_QMMM(cr, forceForUseWithShiftForces, fr);
    }
    /* Call the short range functions all in one go. */

    if (ir->nwall)
    {
        /* foreign lambda component for walls */
        real dvdl_walls = do_walls(*ir, *fr, box, *md, x,
                                   &forceWithVirial, lambda[efptVDW],
                                   enerd->grpp.ener[egLJSR].data(), nrnb);
        enerd->dvdl_lin[efptVDW] += dvdl_walls;
    }
    /* Shift the coordinates. Must be done before listed forces and PPPM,
     * but is also necessary for SHAKE and update, therefore it can NOT
     * go when no listed forces have to be evaluated.
     *
     * The shifting and PBC code is deliberately not timed, since with
     * the Verlet scheme it only takes non-zero time with triclinic
     * boxes, and even then the time is around a factor of 100 less
     * than the next smallest counter.
     */

    /* Here sometimes we would not need to shift with NBFonly,
     * but we do so anyhow for consistency of the returned coordinates.
     */
    if (graph)
    {
        shift_self(graph, box, x);
        if (TRICLINIC(box))
        {
            inc_nrnb(nrnb, eNR_SHIFTX, 2*graph->nnodes);
        }
        else
        {
            inc_nrnb(nrnb, eNR_SHIFTX, graph->nnodes);
        }
    }
    t_pbc pbc;

    /* Check whether we need to take into account PBC in listed interactions. */
    const auto needPbcForListedForces = fr->bMolPBC && bool(flags & GMX_FORCE_LISTED) && haveCpuListedForces(*fr, *idef, *fcd);
    if (needPbcForListedForces)
    {
        /* Since all atoms are in the rectangular or triclinic unit-cell,
         * only single box vector shifts (2 in x) are required.
         */
        set_pbc_dd(&pbc, fr->ePBC, DOMAINDECOMP(cr) ? cr->dd->nc : nullptr,
                   TRUE, box);
    }

    do_force_listed(wcycle, box, ir->fepvals, cr, ms,
                    idef, x, hist,
                    forceForUseWithShiftForces, &forceWithVirial,
                    fr, &pbc, graph, enerd, nrnb, lambda, md, fcd,
                    DOMAINDECOMP(cr) ? cr->dd->globalAtomIndices.data() : nullptr,
                    flags);
    const bool computePmeOnCpu =
        (EEL_PME(fr->ic->eeltype) || EVDW_PME(fr->ic->vdwtype)) &&
        thisRankHasDuty(cr, DUTY_PME) &&
        (pme_run_mode(fr->pmedata) == PmeRunMode::CPU);

    const bool haveEwaldSurfaceTerms =
        EEL_PME_EWALD(fr->ic->eeltype) &&
        (ir->ewald_geometry != eewg3D || ir->epsilon_surface != 0);
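
    /* The Ewald surface/dipole correction is computed on the CPU in this
     * function even when the PME mesh part runs on a GPU or on separate
     * PME ranks, hence the separate condition below. */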
    /* Do long-range electrostatics and/or LJ-PME
     * and compute PME surface terms when necessary.
     */
    if (computePmeOnCpu ||
        fr->ic->eeltype == eelEWALD ||
        haveEwaldSurfaceTerms)
    {
        real Vlr_q = 0, Vlr_lj = 0;

        /* We reduce all virial, dV/dlambda and energy contributions, except
         * for the reciprocal energies (Vlr_q, Vlr_lj) into the same struct.
         */
        ewald_corr_thread_t &ewaldOutput = fr->ewc_t[0];
        clearEwaldThreadOutput(&ewaldOutput);

        if (EEL_PME_EWALD(fr->ic->eeltype) || EVDW_PME(fr->ic->vdwtype))
        {
            /* Calculate Ewald surface terms, when necessary */
            if (haveEwaldSurfaceTerms)
            {
                wallcycle_sub_start(wcycle, ewcsEWALD_CORRECTION);

                if (fr->n_tpi > 0)
                {
                    gmx_fatal(FARGS, "TPI with PME currently only works in a 3D geometry with tin-foil boundary conditions");
                }

                int nthreads = fr->nthread_ewc;
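                /* Each thread accumulates its corrections into its own
                 * ewald_corr_thread_t entry; the entries are summed into
                 * fr->ewc_t[0] by reduceEwaldThreadOuput() below. */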
#pragma omp parallel for num_threads(nthreads) schedule(static)
                for (int t = 0; t < nthreads; t++)
                {
                    try
                    {
                        ewald_corr_thread_t &ewc_t = fr->ewc_t[t];
                        if (t > 0)
                        {
                            clearEwaldThreadOutput(&ewc_t);
                        }

                        /* Threading is only supported with the Verlet cut-off
                         * scheme and then only single particle forces (no
                         * exclusion forces) are calculated, so we can store
                         * the forces in the normal, single forceWithVirial->force_ array.
                         */
                        ewald_LRcorrection(md->homenr, cr, nthreads, t, fr, ir,
                                           md->chargeA, md->chargeB,
                                           (md->nChargePerturbed != 0),
                                           x, box, mu_tot,
                                           as_rvec_array(forceWithVirial.force_.data()),
                                           &ewc_t.Vcorr_q,
                                           lambda[efptCOUL],
                                           &ewc_t.dvdl[efptCOUL]);
                    }
                    GMX_CATCH_ALL_AND_EXIT_WITH_FATAL_ERROR;
                }
                reduceEwaldThreadOuput(nthreads, fr->ewc_t);
                wallcycle_sub_stop(wcycle, ewcsEWALD_CORRECTION);
            }

            if (EEL_PME_EWALD(fr->ic->eeltype) && fr->n_tpi == 0)
            {
                /* This is not in a subcounter because it takes a
                   negligible and constant-sized amount of time */
                ewaldOutput.Vcorr_q +=
                    ewald_charge_correction(cr, fr, lambda[efptCOUL], box,
                                            &ewaldOutput.dvdl[efptCOUL],
                                            ewaldOutput.vir_q);
            }
        }

        if (computePmeOnCpu)
        {
            /* Do reciprocal PME for Coulomb and/or LJ. */
            assert(fr->n_tpi >= 0);
            if (fr->n_tpi == 0 || (flags & GMX_FORCE_STATECHANGED))
            {
                int pme_flags = GMX_PME_SPREAD | GMX_PME_SOLVE;
                int status    = 0;

                if (flags & GMX_FORCE_FORCES)
                {
                    pme_flags |= GMX_PME_CALC_F;
                }
                if (flags & GMX_FORCE_VIRIAL)
                {
                    pme_flags |= GMX_PME_CALC_ENER_VIR;
                }
                if (fr->n_tpi > 0)
                {
                    /* We don't calculate f, but we do want the potential */
                    pme_flags |= GMX_PME_CALC_POT;
                }

                /* With domain decomposition we close the CPU side load
                 * balancing region here, because PME does global
                 * communication that acts as a global barrier.
                 */
                ddBalanceRegionHandler.closeAfterForceComputationCpu();

                wallcycle_start(wcycle, ewcPMEMESH);
                status = gmx_pme_do(fr->pmedata,
                                    gmx::constArrayRefFromArray(coordinates.unpaddedConstArrayRef().data(), md->homenr - fr->n_tpi),
                                    forceWithVirial.force_,
                                    md->chargeA, md->chargeB,
                                    md->sqrt_c6A, md->sqrt_c6B,
                                    md->sigmaA, md->sigmaB,
                                    box, cr,
                                    DOMAINDECOMP(cr) ? dd_pme_maxshift_x(cr->dd) : 0,
                                    DOMAINDECOMP(cr) ? dd_pme_maxshift_y(cr->dd) : 0,
                                    nrnb, wcycle,
                                    ewaldOutput.vir_q, ewaldOutput.vir_lj,
                                    &Vlr_q, &Vlr_lj,
                                    lambda[efptCOUL], lambda[efptVDW],
                                    &ewaldOutput.dvdl[efptCOUL],
                                    &ewaldOutput.dvdl[efptVDW],
                                    pme_flags);
                wallcycle_stop(wcycle, ewcPMEMESH);
                if (status != 0)
                {
                    gmx_fatal(FARGS, "Error %d in reciprocal PME routine", status);
                }

                /* We should try to do as little computation after
                 * this as possible, because parallel PME synchronizes
                 * the nodes, so we want all load imbalance of the
                 * rest of the force calculation to be before the PME
                 * call.  DD load balancing is done on the whole time
                 * of the force call (without PME).
                 */
            }
            if (fr->n_tpi > 0)
            {
                if (EVDW_PME(ir->vdwtype))
                {
                    gmx_fatal(FARGS, "Test particle insertion not implemented with LJ-PME");
                }
                /* Determine the PME grid energy of the test molecule
                 * with the PME grid potential of the other charges.
                 */
                gmx_pme_calc_energy(fr->pmedata,
                                    coordinates.unpaddedConstArrayRef().subArray(md->homenr - fr->n_tpi, fr->n_tpi),
                                    gmx::arrayRefFromArray(md->chargeA + md->homenr - fr->n_tpi, fr->n_tpi),
                                    &Vlr_q);
            }
        }

        if (fr->ic->eeltype == eelEWALD)
        {
            Vlr_q = do_ewald(ir, x, as_rvec_array(forceWithVirial.force_.data()),
                             md->chargeA, md->chargeB,
                             box, cr, md->homenr,
                             ewaldOutput.vir_q, fr->ic->ewaldcoeff_q,
                             lambda[efptCOUL], &ewaldOutput.dvdl[efptCOUL],
                             fr->ewald_table);
        }

        /* Note that with separate PME nodes we get the real energies later */
        // TODO it would be simpler if we just accumulated a single
        // long-range virial contribution.
        forceWithVirial.addVirialContribution(ewaldOutput.vir_q);
        forceWithVirial.addVirialContribution(ewaldOutput.vir_lj);
        enerd->dvdl_lin[efptCOUL] += ewaldOutput.dvdl[efptCOUL];
        enerd->dvdl_lin[efptVDW]  += ewaldOutput.dvdl[efptVDW];
        enerd->term[F_COUL_RECIP]  = Vlr_q + ewaldOutput.Vcorr_q;
        enerd->term[F_LJ_RECIP]    = Vlr_lj + ewaldOutput.Vcorr_lj;

        if (debug)
        {
            fprintf(debug, "Vlr_q = %g, Vcorr_q = %g, Vlr_corr_q = %g\n",
                    Vlr_q, ewaldOutput.Vcorr_q, enerd->term[F_COUL_RECIP]);
            pr_rvecs(debug, 0, "vir_el_recip after corr", ewaldOutput.vir_q, DIM);
            pr_rvecs(debug, 0, "fshift after LR Corrections", fr->fshift, SHIFTS);
            fprintf(debug, "Vlr_lj: %g, Vcorr_lj = %g, Vlr_corr_lj = %g\n",
                    Vlr_lj, ewaldOutput.Vcorr_lj, enerd->term[F_LJ_RECIP]);
            pr_rvecs(debug, 0, "vir_lj_recip after corr", ewaldOutput.vir_lj, DIM);
        }
    }

    if (debug)
    {
        print_nrnb(debug, nrnb);
    }

    if (debug)
    {
        pr_rvecs(debug, 0, "fshift after bondeds", fr->fshift, SHIFTS);
    }
}