src/gromacs/mdrun/md.cpp

   1 /*
   2  * This file is part of the GROMACS molecular simulation package.
   3  *
   4  * Copyright (c) 1991-2000, University of Groningen, The Netherlands.
   5  * Copyright (c) 2001-2004, The GROMACS development team.
   6  * Copyright (c) 2011,2012,2013,2014,2015,2016,2017,2018, by the GROMACS development team, led by
   7  * Mark Abraham, David van der Spoel, Berk Hess, and Erik Lindahl,
   8  * and including many others, as listed in the AUTHORS file in the
   9  * top-level source directory and at http://www.gromacs.org.
  10  *
  11  * GROMACS is free software; you can redistribute it and/or
  12  * modify it under the terms of the GNU Lesser General Public License
  13  * as published by the Free Software Foundation; either version 2.1
  14  * of the License, or (at your option) any later version.
  15  *
  16  * GROMACS is distributed in the hope that it will be useful,
  17  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  18  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  19  * Lesser General Public License for more details.
  20  *
  21  * You should have received a copy of the GNU Lesser General Public
  22  * License along with GROMACS; if not, see
  23  * http://www.gnu.org/licenses, or write to the Free Software Foundation,
  24  * Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA.
  25  *
  26  * If you want to redistribute modifications to GROMACS, please
  27  * consider that scientific software is very special. Version
  28  * control is crucial - bugs must be traceable. We will be happy to
  29  * consider code for inclusion in the official distribution, but
  30  * derived work must not be called official GROMACS. Details are found
  31  * in the README & COPYING files - if they are missing, get the
  32  * official version at http://www.gromacs.org.
  33  *
  34  * To help us fund GROMACS development, we humbly ask that you cite
  35  * the research papers on the package. Check out http://www.gromacs.org.
  36  */
  37 /*! \internal \file
  38  *
  39  * \brief Implements the integrator for normal molecular dynamics simulations
  40  *
  41  * \author David van der Spoel <david.vanderspoel@icm.uu.se>
  42  * \ingroup module_mdrun
  43  */
  44 #include "gmxpre.h"
  45
  46 #include "config.h"
  47
  48 #include <cinttypes>
  49 #include <cmath>
  50 #include <cstdio>
  51 #include <cstdlib>
  52
  53 #include <algorithm>
  54 #include <memory>
  55
  56 #include "gromacs/awh/awh.h"
  57 #include "gromacs/commandline/filenm.h"
  58 #include "gromacs/compat/make_unique.h"
  59 #include "gromacs/domdec/collect.h"
  60 #include "gromacs/domdec/domdec.h"
  61 #include "gromacs/domdec/domdec_network.h"
  62 #include "gromacs/domdec/domdec_struct.h"
  63 #include "gromacs/essentialdynamics/edsam.h"
  64 #include "gromacs/ewald/pme.h"
  65 #include "gromacs/ewald/pme-load-balancing.h"
  66 #include "gromacs/fileio/trxio.h"
  67 #include "gromacs/gmxlib/network.h"
  68 #include "gromacs/gmxlib/nrnb.h"
  69 #include "gromacs/gpu_utils/gpu_utils.h"
  70 #include "gromacs/imd/imd.h"
  71 #include "gromacs/listed-forces/manage-threading.h"
  72 #include "gromacs/math/functions.h"
  73 #include "gromacs/math/utilities.h"
  74 #include "gromacs/math/vec.h"
  75 #include "gromacs/math/vectypes.h"
  76 #include "gromacs/mdlib/checkpointhandler.h"
  77 #include "gromacs/mdlib/compute_io.h"
  78 #include "gromacs/mdlib/constr.h"
  79 #include "gromacs/mdlib/ebin.h"
  80 #include "gromacs/mdlib/expanded.h"
  81 #include "gromacs/mdlib/force.h"
  82 #include "gromacs/mdlib/force_flags.h"
  83 #include "gromacs/mdlib/forcerec.h"
  84 #include "gromacs/mdlib/md_support.h"
  85 #include "gromacs/mdlib/mdatoms.h"
  86 #include "gromacs/mdlib/mdebin.h"
  87 #include "gromacs/mdlib/mdoutf.h"
  88 #include "gromacs/mdlib/mdrun.h"
  89 #include "gromacs/mdlib/mdsetup.h"
  90 #include "gromacs/mdlib/membed.h"
  91 #include "gromacs/mdlib/nb_verlet.h"
  92 #include "gromacs/mdlib/nbnxn_gpu_data_mgmt.h"
  93 #include "gromacs/mdlib/ns.h"
  94 #include "gromacs/mdlib/resethandler.h"
  95 #include "gromacs/mdlib/shellfc.h"
  96 #include "gromacs/mdlib/sighandler.h"
  97 #include "gromacs/mdlib/sim_util.h"
  98 #include "gromacs/mdlib/simulationsignal.h"
  99 #include "gromacs/mdlib/tgroup.h"
 100 #include "gromacs/mdlib/trajectory_writing.h"
 101 #include "gromacs/mdlib/update.h"
 102 #include "gromacs/mdlib/vcm.h"
 103 #include "gromacs/mdlib/vsite.h"
 104 #include "gromacs/mdtypes/awh-history.h"
 105 #include "gromacs/mdtypes/awh-params.h"
 106 #include "gromacs/mdtypes/commrec.h"
 107 #include "gromacs/mdtypes/df_history.h"
 108 #include "gromacs/mdtypes/energyhistory.h"
 109 #include "gromacs/mdtypes/fcdata.h"
 110 #include "gromacs/mdtypes/forcerec.h"
 111 #include "gromacs/mdtypes/group.h"
 112 #include "gromacs/mdtypes/inputrec.h"
 113 #include "gromacs/mdtypes/interaction_const.h"
 114 #include "gromacs/mdtypes/md_enums.h"
 115 #include "gromacs/mdtypes/mdatom.h"
 116 #include "gromacs/mdtypes/observableshistory.h"
 117 #include "gromacs/mdtypes/state.h"
 118 #include "gromacs/pbcutil/mshift.h"
 119 #include "gromacs/pbcutil/pbc.h"
 120 #include "gromacs/pulling/pull.h"
 121 #include "gromacs/swap/swapcoords.h"
 122 #include "gromacs/timing/wallcycle.h"
 123 #include "gromacs/timing/walltime_accounting.h"
 124 #include "gromacs/topology/atoms.h"
 125 #include "gromacs/topology/idef.h"
 126 #include "gromacs/topology/mtop_util.h"
 127 #include "gromacs/topology/topology.h"
 128 #include "gromacs/trajectory/trajectoryframe.h"
 129 #include "gromacs/utility/basedefinitions.h"
 130 #include "gromacs/utility/cstringutil.h"
 131 #include "gromacs/utility/fatalerror.h"
 132 #include "gromacs/utility/logger.h"
 133 #include "gromacs/utility/real.h"
 134 #include "gromacs/utility/smalloc.h"
 135
 136 #include "integrator.h"
 137 #include "replicaexchange.h"
 138
 139 #ifdef GMX_FAHCORE
 140 #include "corewrap.h"
 141 #endif
 142
 143 using gmx::SimulationSignaller;
 144
 145 /*! \brief Load a rerun trajectory frame into the global state, optionally rebuilding vsites
 146  *
 147  * Positions and the box are always taken from \p rerunFrame. Velocities are
 148  * taken from the frame when it provides them and are zeroed otherwise.
 149  *
 150  * \param[in]     rerunFrame      Trajectory frame supplying positions, box and possibly velocities
 151  * \param[in,out] globalState     Global state container that receives the frame data
 152  * \param[in]     constructVsites Whether vsite coordinates are constructed after the copy
 153  * \param[in]     vsite           Vsite setup, may be nullptr when \p constructVsites = false
 154  * \param[in]     idef            Topology parameters handed to the vsite construction
 155  * \param[in]     timeStep        Time step handed to the vsite construction
 156  * \param[in]     forceRec        Force record, supplies the PBC settings for the vsite construction
 157  * \param[in,out] graph           Molecular graph; when != nullptr the coordinates are shifted with it before and unshifted after vsite construction
 158  * \param[in,out] warnWhenNoV     When true, a warning is printed if \p rerunFrame has no velocities; set to false once the warning was printed
 159  */
 160 static void prepareRerunState(const t_trxframe  &rerunFrame,
 161                               t_state           *globalState,
 162                               bool               constructVsites,
 163                               const gmx_vsite_t *vsite,
 164                               const t_idef      &idef,
 165                               double             timeStep,
 166                               const t_forcerec  &forceRec,
 167                               t_graph           *graph,
 168                               gmx_bool          *warnWhenNoV)
 169 {
 170     const int numAtoms = globalState->natoms;
 171     for (int atom = 0; atom < numAtoms; atom++)
 172     {
 173         copy_rvec(rerunFrame.x[atom], globalState->x[atom]);
 174         if (rerunFrame.bV)
 175         {
 176             copy_rvec(rerunFrame.v[atom], globalState->v[atom]);
 177         }
 178         else
 179         {
 180             clear_rvec(globalState->v[atom]);
 181         }
 182     }
 183     copy_mat(rerunFrame.box, globalState->box);
 184
 185     if (!rerunFrame.bV && *warnWhenNoV)
 186     {
 187         fprintf(stderr, "\nWARNING: Some frames do not contain velocities.\n"
 188                 "         Ekin, temperature and pressure are incorrect,\n"
 189                 "         the virial will be incorrect when constraints are present.\n"
 190                 "\n");
 191         *warnWhenNoV = FALSE;
 192     }
 193
 194     if (!constructVsites)
 195     {
 196         return;
 197     }
 198     GMX_ASSERT(vsite, "Need valid vsite for constructing vsites");
 199     rvec *x = as_rvec_array(globalState->x.data());
 200     if (graph != nullptr)
 201     {
 202         /* The graph may be out of sync with the coordinates when only
 203          * every N'th coordinate set is available, so redo the shifts first.
 204          */
 205         mk_mshift(nullptr, graph, forceRec.ePBC, globalState->box, x);
 206         shift_self(graph, globalState->box, x);
 207     }
 208     construct_vsites(vsite, x, timeStep, as_rvec_array(globalState->v.data()),
 209                      idef.iparams, idef.il,
 210                      forceRec.ePBC, forceRec.bMolPBC, nullptr, globalState->box);
 211     if (graph != nullptr)
 212     {
 213         unshift_self(graph, globalState->box, x);
 214     }
 215 }
 216
 217 void gmx::Integrator::do_md()
 218 {
 219     // TODO Historically, the EM and MD "integrators" used different
 220     // names for the t_inputrec *parameter, but these must have the
 221     // same name, now that it's a member of a struct. We use this ir
 222     // alias to avoid a large ripple of nearly useless changes.
 223     // t_inputrec is being replaced by IMdpOptionsProvider, so this
 224     // will go away eventually.
 225     t_inputrec       *ir   = inputrec;
 226     gmx_mdoutf       *outf = nullptr;
 227     int64_t           step, step_rel;
 228     double            t, t0, lam0[efptNR];
 229     gmx_bool          bGStatEveryStep, bGStat, bCalcVir, bCalcEnerStep, bCalcEner;
 230     gmx_bool          bNS, bNStList, bSimAnn, bStopCM,
 231                       bFirstStep, bInitStep, bLastStep = FALSE;
 232     gmx_bool          bDoDHDL = FALSE, bDoFEP = FALSE, bDoExpanded = FALSE;
 233     gmx_bool          do_ene, do_log, do_verbose, bRerunWarnNoV = TRUE,
 234                       bForceUpdate = FALSE;
 235     gmx_bool          bMasterState;
 236     int               force_flags, cglo_flags;
 237     tensor            force_vir, shake_vir, total_vir, tmp_vir, pres;
 238     int               i, m;
 239     t_trxstatus      *status;
 240     rvec              mu_tot;
 241     t_vcm            *vcm;
 242     matrix            parrinellorahmanMu, M;
 243     t_trxframe        rerun_fr;
 244     gmx_repl_ex_t     repl_ex = nullptr;
 245     gmx_localtop_t   *top;
 246     t_mdebin         *mdebin   = nullptr;
 247     gmx_enerdata_t   *enerd;
 248     PaddedRVecVector  f {};
 249     gmx_global_stat_t gstat;
 250     gmx_update_t     *upd   = nullptr;
 251     t_graph          *graph = nullptr;
 252     gmx_groups_t     *groups;
 253     gmx_ekindata_t   *ekind;
 254     gmx_shellfc_t    *shellfc;
 255     gmx_bool          bSumEkinhOld, bDoReplEx, bExchanged, bNeedRepartition;
 256     gmx_bool          bTemp, bPres, bTrotter;
 257     real              dvdl_constr;
 258     rvec             *cbuf        = nullptr;
 259     int               cbuf_nalloc = 0;
 260     matrix            lastbox;
 261     int               lamnew  = 0;
 262     /* for FEP */
 263     int               nstfep = 0;
 264     double            cycles;
 265     real              saved_conserved_quantity = 0;
 266     real              last_ekin                = 0;
 267     t_extmass         MassQ;
 268     int             **trotter_seq;
 269     char              sbuf[STEPSTRSIZE], sbuf2[STEPSTRSIZE];
 270     int               handled_stop_condition = gmx_stop_cond_none; /* compare to get_stop_condition*/
 271
 272
 273     /* PME load balancing data for GPU kernels */
 274     pme_load_balancing_t *pme_loadbal      = nullptr;
 275     gmx_bool              bPMETune         = FALSE;
 276     gmx_bool              bPMETunePrinting = FALSE;
 277
 278     /* Interactive MD */
 279     gmx_bool          bIMDstep = FALSE;
 280
 281 #ifdef GMX_FAHCORE
 282     /* Temporary addition for FAHCORE checkpointing */
 283     int chkpt_ret;
 284 #endif
 285     /* Domain decomposition could incorrectly miss a bonded
 286        interaction, but checking for that requires a global
 287        communication stage, which does not otherwise happen in DD
 288        code. So we do that alongside the first global energy reduction
 289        after a new DD is made. These variables handle whether the
 290        check happens, and the result it returns. */
 291     bool              shouldCheckNumberOfBondedInteractions = false;
 292     int               totalNumberOfBondedInteractions       = -1;
 293
 294     SimulationSignals signals;
 295     // Most global communication stages don't propagate mdrun
 296     // signals, and will use this object to achieve that.
 297     SimulationSignaller nullSignaller(nullptr, nullptr, nullptr, false, false);
 298
 299     if (!mdrunOptions.writeConfout)
 300     {
 301         // This is on by default, and the main known use case for
 302         // turning it off is for convenience in benchmarking, which is
 303         // something that should not show up in the general user
 304         // interface.
 305         GMX_LOG(mdlog.info).asParagraph().
 306             appendText("The -noconfout functionality is deprecated, and may be removed in a future version.");
 307     }
 308
 309     /* md-vv uses averaged full step velocities for T-control
 310        md-vv-avek uses averaged half step velocities for T-control (but full step ekin for P control)
 311        md uses averaged half step kinetic energies to determine temperature unless defined otherwise by GMX_EKIN_AVE_VEL; */
 312     bTrotter = (EI_VV(ir->eI) && (inputrecNptTrotter(ir) || inputrecNphTrotter(ir) || inputrecNvtTrotter(ir)));
 313
 314     const gmx_bool bRerunMD      = mdrunOptions.rerun;
 315     int            nstglobalcomm = mdrunOptions.globalCommunicationInterval;
 316
 317     if (bRerunMD)
 318     {
 319         /* Since we don't know if the frames read are related in any way,
 320          * rebuild the neighborlist at every step.
 321          */
 322         ir->nstlist       = 1;
 323         ir->nstcalcenergy = 1;
 324         nstglobalcomm     = 1;
 325     }
 326
 327     nstglobalcomm   = check_nstglobalcomm(mdlog, nstglobalcomm, ir);
 328     bGStatEveryStep = (nstglobalcomm == 1);
 329
 330     if (bRerunMD)
 331     {
 332         ir->nstxout_compressed = 0;
 333     }
 334     groups = &top_global->groups;
 335
 336     std::unique_ptr<EssentialDynamics> ed = nullptr;
 337     if (opt2bSet("-ei", nfile, fnm) || observablesHistory->edsamHistory != nullptr)
 338     {
 339         /* Initialize essential dynamics sampling */
 340         ed = init_edsam(opt2fn_null("-ei", nfile, fnm), opt2fn("-eo", nfile, fnm),
 341                         top_global,
 342                         ir, cr, constr,
 343                         state_global, observablesHistory,
 344                         oenv, mdrunOptions.continuationOptions.appendFiles);
 345     }
 346
 347     /* Initial values */
 348     init_md(fplog, cr, outputProvider, ir, oenv, mdrunOptions,
 349             &t, &t0, state_global, lam0,
 350             nrnb, top_global, &upd, deform,
 351             nfile, fnm, &outf, &mdebin,
 352             force_vir, shake_vir, total_vir, pres, mu_tot, &bSimAnn, &vcm, wcycle);
 353
 354     /* Energy terms and groups */
 355     snew(enerd, 1);
 356     init_enerdata(top_global->groups.grps[egcENER].nr, ir->fepvals->n_lambda,
 357                   enerd);
 358
 359     /* Kinetic energy data */
 360     snew(ekind, 1);
 361     init_ekindata(fplog, top_global, &(ir->opts), ekind);
 362     /* Copy the cos acceleration to the groups struct */
 363     ekind->cosacc.cos_accel = ir->cos_accel;
 364
 365     gstat = global_stat_init(ir);
 366
 367     /* Check for polarizable models and flexible constraints */
 368     shellfc = init_shell_flexcon(fplog,
 369                                  top_global, constr ? constr->numFlexibleConstraints() : 0,
 370                                  ir->nstcalcenergy, DOMAINDECOMP(cr));
 371
 372     {
 373         double io = compute_io(ir, top_global->natoms, groups, mdebin->ebin->nener, 1);
 374         if ((io > 2000) && MASTER(cr))
 375         {
 376             fprintf(stderr,
 377                     "\nWARNING: This run will generate roughly %.0f Mb of data\n\n",
 378                     io);
 379         }
 380     }
 381
 382     /* Set up interactive MD (IMD) */
 383     init_IMD(ir, cr, ms, top_global, fplog, ir->nstcalcenergy,
 384              MASTER(cr) ? as_rvec_array(state_global->x.data()) : nullptr,
 385              nfile, fnm, oenv, mdrunOptions);
 386
 387     // Local state only becomes valid now.
 388     std::unique_ptr<t_state> stateInstance;
 389     t_state *                state;
 390
 391     if (DOMAINDECOMP(cr))
 392     {
 393         top = dd_init_local_top(top_global);
 394
 395         stateInstance = compat::make_unique<t_state>();
 396         state         = stateInstance.get();
 397         dd_init_local_state(cr->dd, state_global, state);
 398
 399         /* Distribute the charge groups over the nodes from the master node */
 400         dd_partition_system(fplog, mdlog, ir->init_step, cr, TRUE, 1,
 401                             state_global, top_global, ir,
 402                             state, &f, mdAtoms, top, fr,
 403                             vsite, constr,
 404                             nrnb, nullptr, FALSE);
 405         shouldCheckNumberOfBondedInteractions = true;
 406         update_realloc(upd, state->natoms);
 407     }
 408     else
 409     {
 410         state_change_natoms(state_global, state_global->natoms);
 411         /* We need to allocate one element extra, since we might use
 412          * (unaligned) 4-wide SIMD loads to access rvec entries.
 413          */
 414         f.resize(gmx::paddedRVecVectorSize(state_global->natoms));
 415         /* Copy the pointer to the global state */
 416         state = state_global;
 417
 418         snew(top, 1);
 419         mdAlgorithmsSetupAtomData(cr, ir, top_global, top, fr,
 420                                   &graph, mdAtoms, constr, vsite, shellfc);
 421
 422         update_realloc(upd, state->natoms);
 423     }
 424
 425     auto mdatoms = mdAtoms->mdatoms();
 426
 427     // NOTE: The global state is no longer used at this point.
 428     // But state_global is still used as temporary storage space for writing
 429     // the global state to file and potentially for replica exchange.
 430     // (Global topology should persist.)
 431
 432     update_mdatoms(mdatoms, state->lambda[efptMASS]);
 433
 434     const ContinuationOptions &continuationOptions    = mdrunOptions.continuationOptions;
 435     bool                       startingFromCheckpoint = continuationOptions.startedFromCheckpoint;
 436
 437     if (ir->bExpanded)
 438     {
 439         init_expanded_ensemble(startingFromCheckpoint, ir, state->dfhist);
 440     }
 441
 442     if (MASTER(cr))
 443     {
 444         if (startingFromCheckpoint)
 445         {
 446             /* Update mdebin with energy history if appending to output files */
 447             if (continuationOptions.appendFiles)
 448             {
 449                 restore_energyhistory_from_state(mdebin, observablesHistory->energyHistory.get());
 450             }
 451             else if (observablesHistory->energyHistory != nullptr)
 452             {
 453                 /* We might have read an energy history from checkpoint.
 454                  * As we are not appending, we want to restart the statistics.
 455                  * Free the allocated memory and reset the counts.
 456                  */
 457                 observablesHistory->energyHistory = {};
 458             }
 459         }
 460         if (observablesHistory->energyHistory == nullptr)
 461         {
 462             observablesHistory->energyHistory = compat::make_unique<energyhistory_t>();
 463         }
 464         /* Set the initial energy history in state by updating once */
 465         update_energyhistory(observablesHistory->energyHistory.get(), mdebin);
 466     }
 467
 468     // TODO: Remove this by converting AWH into a ForceProvider
 469     auto awh = prepareAwhModule(fplog, *ir, state_global, cr, ms, startingFromCheckpoint,
 470                                 shellfc != nullptr,
 471                                 opt2fn("-awh", nfile, fnm), ir->pull_work);
 472
 473     const bool useReplicaExchange = (replExParams.exchangeInterval > 0);
 474     if (useReplicaExchange && MASTER(cr))
 475     {
 476         repl_ex = init_replica_exchange(fplog, ms, top_global->natoms, ir,
 477                                         replExParams);
 478     }
 479     /* PME tuning is only supported in the Verlet scheme, with PME for
 480      * Coulomb. It is not supported with only LJ PME, or for
 481      * reruns. */
 482     bPMETune = (mdrunOptions.tunePme && EEL_PME(fr->ic->eeltype) && !bRerunMD &&
 483                 !mdrunOptions.reproducible && ir->cutoff_scheme != ecutsGROUP);
 484     if (bPMETune)
 485     {
 486         pme_loadbal_init(&pme_loadbal, cr, mdlog, *ir, state->box,
 487                          *fr->ic, *fr->nbv->listParams, fr->pmedata, use_GPU(fr->nbv),
 488                          &bPMETunePrinting);
 489     }
 490
 491     if (!ir->bContinuation && !bRerunMD)
 492     {
 493         if (state->flags & (1 << estV))
 494         {
 495             /* Set the velocities of vsites, shells and frozen atoms to zero */
 496             for (i = 0; i < mdatoms->homenr; i++)
 497             {
 498                 if (mdatoms->ptype[i] == eptVSite ||
 499                     mdatoms->ptype[i] == eptShell)
 500                 {
 501                     clear_rvec(state->v[i]);
 502                 }
 503                 else if (mdatoms->cFREEZE)
 504                 {
 505                     for (m = 0; m < DIM; m++)
 506                     {
 507                         if (ir->opts.nFreeze[mdatoms->cFREEZE[i]][m])
 508                         {
 509                             state->v[i][m] = 0;
 510                         }
 511                     }
 512                 }
 513             }
 514         }
 515
 516         if (constr)
 517         {
 518             /* Constrain the initial coordinates and velocities */
 519             do_constrain_first(fplog, constr, ir, mdatoms, state);
 520         }
 521         if (vsite)
 522         {
 523             /* Construct the virtual sites for the initial configuration */
 524             construct_vsites(vsite, as_rvec_array(state->x.data()), ir->delta_t, nullptr,
 525                              top->idef.iparams, top->idef.il,
 526                              fr->ePBC, fr->bMolPBC, cr, state->box);
 527         }
 528     }
 529
 530     if (ir->efep != efepNO)
 531     {
 532         /* Set free energy calculation frequency as the greatest common
 533          * divisor of nstdhdl and, when in use, nstexpanded and the replica exchange interval. */
 534         nstfep = ir->fepvals->nstdhdl;
 535         if (ir->bExpanded)
 536         {
 537             nstfep = gmx_greatest_common_divisor(ir->expandedvals->nstexpanded, nstfep);
 538         }
 539         if (useReplicaExchange)
 540         {
 541             nstfep = gmx_greatest_common_divisor(replExParams.exchangeInterval, nstfep);
 542         }
 543     }
 544
 545     /* Be REALLY careful about what flags you set here. You CANNOT assume
 546      * this is the first step, since we might be restarting from a checkpoint,
 547      * and in that case we should not do any modifications to the state.
 548      */
 549     bStopCM = (ir->comm_mode != ecmNO && !ir->bContinuation);
 550
 551     if (continuationOptions.haveReadEkin)
 552     {
 553         restore_ekinstate_from_state(cr, ekind, &state_global->ekinstate);
 554     }
 555
 556     cglo_flags = (CGLO_INITIALIZATION | CGLO_TEMPERATURE | CGLO_GSTAT
 557                   | (EI_VV(ir->eI) ? CGLO_PRESSURE : 0)
 558                   | (EI_VV(ir->eI) ? CGLO_CONSTRAINT : 0)
 559                   | (continuationOptions.haveReadEkin ? CGLO_READEKIN : 0));
 560
 561     bSumEkinhOld = FALSE;
 562     /* To minimize communication, compute_globals computes the COM velocity
 563      * and the kinetic energy for the velocities without COM motion removed.
 564      * Thus to get the kinetic energy without the COM contribution, we need
 565      * to call compute_globals twice.
 566      */
 567     for (int cgloIteration = 0; cgloIteration < (bStopCM ? 2 : 1); cgloIteration++)
 568     {
 569         int cglo_flags_iteration = cglo_flags;
 570         if (bStopCM && cgloIteration == 0)
 571         {
 572             cglo_flags_iteration |= CGLO_STOPCM;
 573             cglo_flags_iteration &= ~CGLO_TEMPERATURE;
 574         }
 575         compute_globals(fplog, gstat, cr, ir, fr, ekind, state, mdatoms, nrnb, vcm,
 576                         nullptr, enerd, force_vir, shake_vir, total_vir, pres, mu_tot,
 577                         constr, &nullSignaller, state->box,
 578                         &totalNumberOfBondedInteractions, &bSumEkinhOld, cglo_flags_iteration
 579                         | (shouldCheckNumberOfBondedInteractions ? CGLO_CHECK_NUMBER_OF_BONDED_INTERACTIONS : 0));
 580     }
 581     checkNumberOfBondedInteractions(mdlog, cr, totalNumberOfBondedInteractions,
 582                                     top_global, top, state,
 583                                     &shouldCheckNumberOfBondedInteractions);
 584     if (ir->eI == eiVVAK)
 585     {
 586         /* a second call to get the half step temperature initialized as well */
 587         /* we do the same call as above, but turn the pressure off -- internally to
 588            compute_globals, this is recognized as a velocity verlet half-step
 589            kinetic energy calculation.  This minimized excess variables, but
 590            perhaps loses some logic?*/
 591
 592         compute_globals(fplog, gstat, cr, ir, fr, ekind, state, mdatoms, nrnb, vcm,
 593                         nullptr, enerd, force_vir, shake_vir, total_vir, pres, mu_tot,
 594                         constr, &nullSignaller, state->box,
 595                         nullptr, &bSumEkinhOld,
 596                         cglo_flags & ~CGLO_PRESSURE);
 597     }
 598
 599     /* Calculate the initial half step temperature, and save the ekinh_old */
 600     if (!continuationOptions.startedFromCheckpoint)
 601     {
 602         for (i = 0; (i < ir->opts.ngtc); i++)
 603         {
 604             copy_mat(ekind->tcstat[i].ekinh, ekind->tcstat[i].ekinh_old);
 605         }
 606     }
 607
 608     /* need to make an initiation call to get the Trotter variables set, as well as other constants for non-trotter
 609        temperature control */
 610     trotter_seq = init_npt_vars(ir, state, &MassQ, bTrotter);
 611
 612     if (MASTER(cr))
 613     {
 614         if (!ir->bContinuation)
 615         {
 616             if (constr && ir->eConstrAlg == econtLINCS)
 617             {
 618                 fprintf(fplog,
 619                         "RMS relative constraint deviation after constraining: %.2e\n",
 620                         constr->rmsd());
 621             }
 622             if (EI_STATE_VELOCITY(ir->eI))
 623             {
 624                 real temp = enerd->term[F_TEMP];
 625                 if (ir->eI != eiVV)
 626                 {
 627                     /* Result of Ekin averaged over velocities of -half
 628                      * and +half step, while we only have -half step here.
 629                      */
 630                     temp *= 2;
 631                 }
 632                 fprintf(fplog, "Initial temperature: %g K\n", temp);
 633             }
 634         }
 635
 636         if (bRerunMD)
 637         {
 638             fprintf(stderr, "starting md rerun '%s', reading coordinates from"
 639                     " input trajectory '%s'\n\n",
 640                     *(top_global->name), opt2fn("-rerun", nfile, fnm));
 641             if (mdrunOptions.verbose)
 642             {
 643                 fprintf(stderr, "Calculated time to finish depends on nsteps from "
 644                         "run input file,\nwhich may not correspond to the time "
 645                         "needed to process input trajectory.\n\n");
 646             }
 647         }
 648         else
 649         {
 650             char tbuf[20];
 651             fprintf(stderr, "starting mdrun '%s'\n",
 652                     *(top_global->name));
 653             if (ir->nsteps >= 0)
 654             {
 655                 sprintf(tbuf, "%8.1f", (ir->init_step+ir->nsteps)*ir->delta_t);
 656             }
 657             else
 658             {
 659                 sprintf(tbuf, "%s", "infinite");
 660             }
 661             if (ir->init_step > 0)
 662             {
 663                 fprintf(stderr, "%s steps, %s ps (continuing from step %s, %8.1f ps).\n",
 664                         gmx_step_str(ir->init_step+ir->nsteps, sbuf), tbuf,
 665                         gmx_step_str(ir->init_step, sbuf2),
 666                         ir->init_step*ir->delta_t);
 667             }
 668             else
 669             {
 670                 fprintf(stderr, "%s steps, %s ps.\n",
 671                         gmx_step_str(ir->nsteps, sbuf), tbuf);
 672             }
 673         }
 674         fprintf(fplog, "\n");
 675     }
 676
 677     walltime_accounting_start_time(walltime_accounting);
 678     wallcycle_start(wcycle, ewcRUN);
 679     print_start(fplog, cr, walltime_accounting, "mdrun");
 680
 681     /* safest point to do file checkpointing is here.  More general point would be immediately before integrator call */
 682 #ifdef GMX_FAHCORE
 683     chkpt_ret = fcCheckPointParallel( cr->nodeid,
 684                                       NULL, 0);
 685     if (chkpt_ret == 0)
 686     {
 687         gmx_fatal( 3, __FILE__, __LINE__, "Checkpoint error on step %d\n", 0 );
 688     }
 689 #endif
 690
 691     /***********************************************************
 692      *
 693      *             Loop over MD steps
 694      *
 695      ************************************************************/
 696
 697     /* if rerunMD then read coordinates and velocities from input trajectory */
 698     if (bRerunMD)
 699     {
 700         if (getenv("GMX_FORCE_UPDATE"))
 701         {
 702             bForceUpdate = TRUE;
 703         }
 704
 705         rerun_fr.natoms = 0;
 706         if (MASTER(cr))
 707         {
 708             bLastStep = !read_first_frame(oenv, &status,
 709                                           opt2fn("-rerun", nfile, fnm),
 710                                           &rerun_fr, TRX_NEED_X | TRX_READ_V);
 711             if (rerun_fr.natoms != top_global->natoms)
 712             {
 713                 gmx_fatal(FARGS,
 714                           "Number of atoms in trajectory (%d) does not match the "
 715                           "run input file (%d)\n",
 716                           rerun_fr.natoms, top_global->natoms);
 717             }
 718             if (ir->ePBC != epbcNONE)
 719             {
 720                 if (!rerun_fr.bBox)
 721                 {
 722                     gmx_fatal(FARGS, "Rerun trajectory frame step %" PRId64 " time %f does not contain a box, while pbc is used", rerun_fr.step, rerun_fr.time);
 723                 }
 724                 if (max_cutoff2(ir->ePBC, rerun_fr.box) < gmx::square(fr->rlist))
 725                 {
 726                     gmx_fatal(FARGS, "Rerun trajectory frame step %" PRId64 " time %f has too small box dimensions", rerun_fr.step, rerun_fr.time);
 727                 }
 728             }
 729         }
 730
 731         if (PAR(cr))
 732         {
 733             rerun_parallel_comm(cr, &rerun_fr, &bLastStep);
 734         }
 735
 736         if (ir->ePBC != epbcNONE)
 737         {
 738             /* Set the shift vectors.
 739              * Necessary here when we have a static box different from the tpr box.
 740              */
 741             calc_shifts(rerun_fr.box, fr->shift_vec);
 742         }
 743     }
 744
 745     bFirstStep       = TRUE;
 746     /* Skip the first Nose-Hoover integration when we get the state from tpx */
 747     bInitStep        = !startingFromCheckpoint || EI_VV(ir->eI);
 748     bSumEkinhOld     = FALSE;
 749     bExchanged       = FALSE;
 750     bNeedRepartition = FALSE;
 751
 752     bool simulationsShareState = false;
 753     int  nstSignalComm         = nstglobalcomm;
 754     {
 755         // TODO This implementation of ensemble orientation restraints is nasty because
 756         // a user can't just do multi-sim with single-sim orientation restraints.
 757         bool usingEnsembleRestraints = (fcd->disres.nsystems > 1) || ((ms != nullptr) && (fcd->orires.nr != 0));
 758         bool awhUsesMultiSim         = (ir->bDoAwh && ir->awhParams->shareBiasMultisim && (ms != nullptr));
 759
 760         // Replica exchange, ensemble restraints and AWH need all
 761         // simulations to remain synchronized, so they need
 762         // checkpoints and stop conditions to act on the same step, so
 763         // the propagation of such signals must take place between
 764         // simulations, not just within simulations.
 765         // TODO: Make algorithm initializers set these flags.
 766         simulationsShareState      = useReplicaExchange || usingEnsembleRestraints || awhUsesMultiSim;
 767
 768         signals[eglsSTOPCOND]      = SimulationSignal(!simulationsShareState);
 769
 770         if (simulationsShareState)
 771         {
 772             // Inter-simulation signal communication does not need to happen
 773             // often, so we use a minimum of 200 steps to reduce overhead.
 774             const int c_minimumInterSimulationSignallingInterval = 200;
 775             nstSignalComm = ((c_minimumInterSimulationSignallingInterval + nstglobalcomm - 1)/nstglobalcomm)*nstglobalcomm;
 776         }
 777     }
 778
 779     std::unique_ptr<CheckpointHandler> checkpointHandler = nullptr;
 780
 781     if (!bRerunMD)
 782     {
 783         checkpointHandler = compat::make_unique<CheckpointHandler>(
 784                     compat::make_not_null<SimulationSignal*>(&signals[eglsCHKPT]),
 785                     simulationsShareState, ir->nstlist == 0, MASTER(cr),
 786                     mdrunOptions.writeConfout, mdrunOptions.checkpointOptions.period);
 787     }
 788
 789     const bool resetCountersIsLocal = true;
 790     auto       resetHandler         = compat::make_unique<ResetHandler>(
 791                 compat::make_not_null<SimulationSignal*>(&signals[eglsRESETCOUNTERS]), !resetCountersIsLocal,
 792                 ir->nsteps, MASTER(cr), mdrunOptions.timingOptions.resetHalfway,
 793                 mdrunOptions.maximumHoursToRun, mdlog, wcycle, walltime_accounting);
 794
 795     DdOpenBalanceRegionBeforeForceComputation ddOpenBalanceRegion   = (DOMAINDECOMP(cr) ? DdOpenBalanceRegionBeforeForceComputation::yes : DdOpenBalanceRegionBeforeForceComputation::no);
 796     DdCloseBalanceRegionAfterForceComputation ddCloseBalanceRegion  = (DOMAINDECOMP(cr) ? DdCloseBalanceRegionAfterForceComputation::yes : DdCloseBalanceRegionAfterForceComputation::no);
 797
 798     step     = ir->init_step;
 799     step_rel = 0;
 800
 801     // TODO extract this to new multi-simulation module
 802     if (MASTER(cr) && isMultiSim(ms) && !useReplicaExchange)
 803     {
 804         if (!multisim_int_all_are_equal(ms, ir->nsteps))
 805         {
 806             GMX_LOG(mdlog.warning).appendText(
 807                     "Note: The number of steps is not consistent across multi simulations,\n"
 808                     "but we are proceeding anyway!");
 809         }
 810         if (!multisim_int_all_are_equal(ms, ir->init_step))
 811         {
 812             GMX_LOG(mdlog.warning).appendText(
 813                     "Note: The initial step is not consistent across multi simulations,\n"
 814                     "but we are proceeding anyway!");
 815         }
 816     }
 817
 818     /* and stop now if we should */
 819     bLastStep = (bLastStep || (ir->nsteps >= 0 && step_rel > ir->nsteps));
 820     while (!bLastStep)
 821     {
 822
 823         /* Determine if this is a neighbor search step */
 824         bNStList = (ir->nstlist > 0  && step % ir->nstlist == 0);
 825
 826         if (bPMETune && bNStList)
 827         {
 828             /* PME grid + cut-off optimization with GPUs or PME nodes */
 829             pme_loadbal_do(pme_loadbal, cr,
 830                            (mdrunOptions.verbose && MASTER(cr)) ? stderr : nullptr,
 831                            fplog, mdlog,
 832                            *ir, fr, *state,
 833                            wcycle,
 834                            step, step_rel,
 835                            &bPMETunePrinting);
 836         }
 837
 838         wallcycle_start(wcycle, ewcSTEP);
 839
 840         if (bRerunMD)
 841         {
 842             if (rerun_fr.bStep)
 843             {
 844                 step     = rerun_fr.step;
 845                 step_rel = step - ir->init_step;
 846             }
 847             if (rerun_fr.bTime)
 848             {
 849                 t = rerun_fr.time;
 850             }
 851             else
 852             {
 853                 t = step;
 854             }
 855         }
 856         else
 857         {
 858             bLastStep = (step_rel == ir->nsteps);
 859             t         = t0 + step*ir->delta_t;
 860         }
 861
 862         // TODO Refactor this, so that nstfep does not need a default value of zero
 863         if (ir->efep != efepNO || ir->bSimTemp)
 864         {
 865             /* find and set the current lambdas.  If rerunning, we either read in a state, or a lambda value,
 866                requiring different logic. */
 867             if (bRerunMD)
 868             {
 869                 if (MASTER(cr))
 870                 {
 871                     setCurrentLambdasRerun(step, ir->fepvals, &rerun_fr, lam0, state_global);
 872                 }
 873             }
 874             else
 875             {
 876                 setCurrentLambdasLocal(step, ir->fepvals, lam0, state);
 877             }
 878             bDoDHDL      = do_per_step(step, ir->fepvals->nstdhdl);
 879             bDoFEP       = ((ir->efep != efepNO) && do_per_step(step, nstfep));
 880             bDoExpanded  = (do_per_step(step, ir->expandedvals->nstexpanded)
 881                             && (ir->bExpanded) && (step > 0) && (!startingFromCheckpoint));
 882         }
 883
 884         bDoReplEx = (useReplicaExchange && (step > 0) && !bLastStep &&
 885                      do_per_step(step, replExParams.exchangeInterval));
 886
 887         if (bSimAnn)
 888         {
 889             update_annealing_target_temp(ir, t, upd);
 890         }
 891
 892         if (bRerunMD && MASTER(cr))
 893         {
 894             const bool constructVsites = ((vsite != nullptr) && mdrunOptions.rerunConstructVsites);
 895             if (constructVsites && DOMAINDECOMP(cr))
 896             {
 897                 gmx_fatal(FARGS, "Vsite recalculation with -rerun is not implemented with domain decomposition, use a single rank");
 898             }
 899             prepareRerunState(rerun_fr, state_global, constructVsites, vsite, top->idef, ir->delta_t, *fr, graph, &bRerunWarnNoV);
 900         }
 901
 902         /* Stop Center of Mass motion */
 903         bStopCM = (ir->comm_mode != ecmNO && do_per_step(step, ir->nstcomm));
 904
 905         if (bRerunMD)
 906         {
 907             /* for rerun MD always do Neighbour Searching */
 908             bNS      = (bFirstStep || ir->nstlist != 0);
 909         }
 910         else
 911         {
 912             /* Determine whether or not to do Neighbour Searching */
 913             bNS = (bFirstStep || bNStList || bExchanged || bNeedRepartition);
 914         }
 915
 916         /* < 0 means stop at next step, > 0 means stop at next NS step */
 917         if ( (signals[eglsSTOPCOND].set < 0) ||
 918              ( (signals[eglsSTOPCOND].set > 0 ) && ( bNS || ir->nstlist == 0)))
 919         {
 920             bLastStep = TRUE;
 921         }
 922
 923         /* do_log triggers energy and virial calculation. Because this leads
 924          * to different code paths, forces can be different. Thus for exact
 925          * continuation we should avoid extra log output.
 926          * Note that the || bLastStep can result in non-exact continuation
 927          * beyond the last step. But we don't consider that to be an issue.
 928          */
 929         do_log     = do_per_step(step, ir->nstlog) || (bFirstStep && !startingFromCheckpoint) || bLastStep || bRerunMD;
 930         do_verbose = mdrunOptions.verbose &&
 931             (step % mdrunOptions.verboseStepPrintInterval == 0 || bFirstStep || bLastStep || bRerunMD);
 932
 933         if (bNS && !(bFirstStep && ir->bContinuation && !bRerunMD))
 934         {
 935             if (bRerunMD)
 936             {
 937                 bMasterState = TRUE;
 938             }
 939             else
 940             {
 941                 bMasterState = FALSE;
 942                 /* Correct the new box if it is too skewed */
 943                 if (inputrecDynamicBox(ir))
 944                 {
 945                     if (correct_box(fplog, step, state->box, graph))
 946                     {
 947                         bMasterState = TRUE;
 948                     }
 949                 }
 950                 if (DOMAINDECOMP(cr) && bMasterState)
 951                 {
 952                     dd_collect_state(cr->dd, state, state_global);
 953                 }
 954             }
 955
 956             if (DOMAINDECOMP(cr))
 957             {
 958                 /* Repartition the domain decomposition */
 959                 dd_partition_system(fplog, mdlog, step, cr,
 960                                     bMasterState, nstglobalcomm,
 961                                     state_global, top_global, ir,
 962                                     state, &f, mdAtoms, top, fr,
 963                                     vsite, constr,
 964                                     nrnb, wcycle,
 965                                     do_verbose && !bPMETunePrinting);
 966                 shouldCheckNumberOfBondedInteractions = true;
 967                 update_realloc(upd, state->natoms);
 968             }
 969         }
 970
 971         if (MASTER(cr) && do_log)
 972         {
 973             print_ebin_header(fplog, step, t); /* can we improve the information printed here? */
 974         }
 975
 976         if (ir->efep != efepNO)
 977         {
 978             update_mdatoms(mdatoms, state->lambda[efptMASS]);
 979         }
 980
 981         if ((bRerunMD && rerun_fr.bV) || bExchanged)
 982         {
 983
 984             /* We need the kinetic energy at minus the half step for determining
 985              * the full step kinetic energy and possibly for T-coupling.*/
 986             /* This may not be quite working correctly yet . . . . */
 987             compute_globals(fplog, gstat, cr, ir, fr, ekind, state, mdatoms, nrnb, vcm,
 988                             wcycle, enerd, nullptr, nullptr, nullptr, nullptr, mu_tot,
 989                             constr, &nullSignaller, state->box,
 990                             &totalNumberOfBondedInteractions, &bSumEkinhOld,
 991                             CGLO_GSTAT | CGLO_TEMPERATURE | CGLO_CHECK_NUMBER_OF_BONDED_INTERACTIONS);
 992             checkNumberOfBondedInteractions(mdlog, cr, totalNumberOfBondedInteractions,
 993                                             top_global, top, state,
 994                                             &shouldCheckNumberOfBondedInteractions);
 995         }
 996         clear_mat(force_vir);
 997
 998         if (!bRerunMD)
 999         {
1000             checkpointHandler->decideIfCheckpointingThisStep(bNS, bFirstStep, bLastStep);
1001         }
1002
1003         /* Determine the energy and pressure:
1004          * at nstcalcenergy steps and at energy output steps (set below).
1005          */
1006         if (EI_VV(ir->eI) && (!bInitStep))
1007         {
1008             /* for vv, the first half of the integration actually corresponds
1009                to the previous step.  bCalcEner is only required to be evaluated on the 'next' step,
1010                but the virial needs to be calculated on both the current step and the 'next' step. Future
1011                reorganization may be able to get rid of one of the bCalcVir=TRUE steps. */
1012
1013             /* TODO: This is probably not what we want, we will write to energy file one step after nstcalcenergy steps. */
1014             bCalcEnerStep = do_per_step(step - 1, ir->nstcalcenergy);
1015             bCalcVir      = bCalcEnerStep ||
1016                 (ir->epc != epcNO && (do_per_step(step, ir->nstpcouple) || do_per_step(step-1, ir->nstpcouple)));
1017         }
1018         else
1019         {
1020             bCalcEnerStep = do_per_step(step, ir->nstcalcenergy);
1021             bCalcVir      = bCalcEnerStep ||
1022                 (ir->epc != epcNO && do_per_step(step, ir->nstpcouple));
1023         }
1024         bCalcEner = bCalcEnerStep;
1025
1026         do_ene = (do_per_step(step, ir->nstenergy) || bLastStep || bRerunMD);
1027
1028         if (do_ene || do_log || bDoReplEx)
1029         {
1030             bCalcVir  = TRUE;
1031             bCalcEner = TRUE;
1032         }
1033
1034         /* Do we need global communication ? */
1035         bGStat = (bCalcVir || bCalcEner || bStopCM ||
1036                   do_per_step(step, nstglobalcomm) ||
1037                   (EI_VV(ir->eI) && inputrecNvtTrotter(ir) && do_per_step(step-1, nstglobalcomm)));
1038
1039         force_flags = (GMX_FORCE_STATECHANGED |
1040                        ((inputrecDynamicBox(ir) || bRerunMD) ? GMX_FORCE_DYNAMICBOX : 0) |
1041                        GMX_FORCE_ALLFORCES |
1042                        (bCalcVir ? GMX_FORCE_VIRIAL : 0) |
1043                        (bCalcEner ? GMX_FORCE_ENERGY : 0) |
1044                        (bDoFEP ? GMX_FORCE_DHDL : 0)
1045                        );
1046
1047         if (shellfc)
1048         {
1049             /* Now is the time to relax the shells */
1050             relax_shell_flexcon(fplog, cr, ms, mdrunOptions.verbose,
1051                                 enforcedRotation, step,
1052                                 ir, bNS, force_flags, top,
1053                                 constr, enerd, fcd,
1054                                 state, f, force_vir, mdatoms,
1055                                 nrnb, wcycle, graph, groups,
1056                                 shellfc, fr, t, mu_tot,
1057                                 vsite,
1058                                 ddOpenBalanceRegion, ddCloseBalanceRegion);
1059         }
1060         else
1061         {
1062             /* The AWH history needs to be saved _before_ doing force calculations where the AWH bias is updated
1063                (or the AWH update will be performed twice for one step when continuing). It would be best to
1064                call this update function from do_md_trajectory_writing but that would occur after do_force.
1065                One would have to divide the update_awh function into one function applying the AWH force
1066                and one doing the AWH bias update. The update AWH bias function could then be called after
1067                do_md_trajectory_writing (then containing update_awh_history).
1068                The checkpointing will in the future probably be moved to the start of the md loop which will
1069                get rid of this issue. */
1070             if (awh && !bRerunMD && checkpointHandler->isCheckpointingStep() && MASTER(cr))
1071             {
1072                 awh->updateHistory(state_global->awhHistory.get());
1073             }
1074
1075             /* The coordinates (x) are shifted (to get whole molecules)
1076              * in do_force.
1077              * This is parallelized as well, and does communication too.
1078              * Check comments in sim_util.c
1079              */
1080             do_force(fplog, cr, ms, ir, awh.get(), enforcedRotation,
1081                      step, nrnb, wcycle, top, groups,
1082                      state->box, state->x, &state->hist,
1083                      f, force_vir, mdatoms, enerd, fcd,
1084                      state->lambda, graph,
1085                      fr, vsite, mu_tot, t, ed ? ed->getLegacyED() : nullptr,
1086                      (bNS ? GMX_FORCE_NS : 0) | force_flags,
1087                      ddOpenBalanceRegion, ddCloseBalanceRegion);
1088         }
1089
1090         if (EI_VV(ir->eI) && !startingFromCheckpoint && !bRerunMD)
1091         /*  ############### START FIRST UPDATE HALF-STEP FOR VV METHODS############### */
1092         {
1093             rvec *vbuf = nullptr;
1094
1095             wallcycle_start(wcycle, ewcUPDATE);
1096             if (ir->eI == eiVV && bInitStep)
1097             {
1098                 /* if using velocity verlet with full time step Ekin,
1099                  * take the first half step only to compute the
1100                  * virial for the first step. From there,
1101                  * revert back to the initial coordinates
1102                  * so that the input is actually the initial step.
1103                  */
1104                 snew(vbuf, state->natoms);
1105                 copy_rvecn(as_rvec_array(state->v.data()), vbuf, 0, state->natoms); /* should make this better for parallelizing? */
1106             }
1107             else
1108             {
1109                 /* this is for NHC in the Ekin(t+dt/2) version of vv */
1110                 trotter_update(ir, step, ekind, enerd, state, total_vir, mdatoms, &MassQ, trotter_seq, ettTSEQ1);
1111             }
1112
1113             update_coords(step, ir, mdatoms, state, f, fcd,
1114                           ekind, M, upd, etrtVELOCITY1,
1115                           cr, constr);
1116
1117             if (!bRerunMD || rerun_fr.bV || bForceUpdate)         /* Why is rerun_fr.bV here?  Unclear. */
1118             {
1119                 wallcycle_stop(wcycle, ewcUPDATE);
1120                 constrain_velocities(step, nullptr,
1121                                      state,
1122                                      shake_vir,
1123                                      wcycle, constr,
1124                                      bCalcVir, do_log, do_ene);
1125                 wallcycle_start(wcycle, ewcUPDATE);
1126             }
1127             else if (graph)
1128             {
1129                 /* Need to unshift here if a do_force has been
1130                    called in the previous step */
1131                 unshift_self(graph, state->box, as_rvec_array(state->x.data()));
1132             }
1133             /* if VV, compute the pressure and constraints */
1134             /* For VV2, we strictly only need this if using pressure
1135              * control, but we really would like to have accurate pressures
1136              * printed out.
1137              * Think about ways around this in the future?
1138              * For now, keep this choice in comments.
1139              */
1140             /*bPres = (ir->eI==eiVV || inputrecNptTrotter(ir)); */
1141             /*bTemp = ((ir->eI==eiVV &&(!bInitStep)) || (ir->eI==eiVVAK && inputrecNptTrotter(ir)));*/
1142             bPres = TRUE;
1143             bTemp = ((ir->eI == eiVV && (!bInitStep)) || (ir->eI == eiVVAK));
1144             if (bCalcEner && ir->eI == eiVVAK)
1145             {
1146                 bSumEkinhOld = TRUE;
1147             }
1148             /* for vv, the first half of the integration actually corresponds to the previous step.
1149                So we need information from the last step in the first half of the integration */
1150             if (bGStat || do_per_step(step-1, nstglobalcomm))
1151             {
1152                 wallcycle_stop(wcycle, ewcUPDATE);
1153                 compute_globals(fplog, gstat, cr, ir, fr, ekind, state, mdatoms, nrnb, vcm,
1154                                 wcycle, enerd, force_vir, shake_vir, total_vir, pres, mu_tot,
1155                                 constr, &nullSignaller, state->box,
1156                                 &totalNumberOfBondedInteractions, &bSumEkinhOld,
1157                                 (bGStat ? CGLO_GSTAT : 0)
1158                                 | CGLO_ENERGY
1159                                 | (bTemp ? CGLO_TEMPERATURE : 0)
1160                                 | (bPres ? CGLO_PRESSURE : 0)
1161                                 | (bPres ? CGLO_CONSTRAINT : 0)
1162                                 | (bStopCM ? CGLO_STOPCM : 0)
1163                                 | (shouldCheckNumberOfBondedInteractions ? CGLO_CHECK_NUMBER_OF_BONDED_INTERACTIONS : 0)
1164                                 | CGLO_SCALEEKIN
1165                                 );
1166                 /* explanation of above:
1167                    a) We compute Ekin at the full time step
1168                    if 1) we are using the AveVel Ekin, and it's not the
1169                    initial step, or 2) if we are using AveEkin, but need the full
1170                    time step kinetic energy for the pressure (always true now, since we want accurate statistics).
1171                    b) If we are using EkinAveEkin for the kinetic energy for the temperature control, we still feed in
1172                    EkinAveVel because it's needed for the pressure */
1173                 checkNumberOfBondedInteractions(mdlog, cr, totalNumberOfBondedInteractions,
1174                                                 top_global, top, state,
1175                                                 &shouldCheckNumberOfBondedInteractions);
1176                 wallcycle_start(wcycle, ewcUPDATE);
1177             }
1178             /* temperature scaling and pressure scaling to produce the extended variables at t+dt */
1179             if (!bInitStep)
1180             {
1181                 if (bTrotter)
1182                 {
1183                     m_add(force_vir, shake_vir, total_vir);     /* we need the un-dispersion corrected total vir here */
1184                     trotter_update(ir, step, ekind, enerd, state, total_vir, mdatoms, &MassQ, trotter_seq, ettTSEQ2);
1185
1186                     /* TODO This is only needed when we're about to write
1187                      * a checkpoint, because we use it after the restart
1188                      * (in a kludge?). But what should we be doing if
1189                      * startingFromCheckpoint or bInitStep are true? */
1190                     if (inputrecNptTrotter(ir) || inputrecNphTrotter(ir))
1191                     {
1192                         copy_mat(shake_vir, state->svir_prev);
1193                         copy_mat(force_vir, state->fvir_prev);
1194                     }
1195                     if (inputrecNvtTrotter(ir) && ir->eI == eiVV)
1196                     {
1197                         /* update temperature and kinetic energy now that step is over - this is the v(t+dt) point */
1198                         enerd->term[F_TEMP] = sum_ekin(&(ir->opts), ekind, nullptr, (ir->eI == eiVV), FALSE);
1199                         enerd->term[F_EKIN] = trace(ekind->ekin);
1200                     }
1201                 }
1202                 else if (bExchanged)
1203                 {
1204                     wallcycle_stop(wcycle, ewcUPDATE);
1205                     /* We need the kinetic energy at minus the half step for determining
1206                      * the full step kinetic energy and possibly for T-coupling.*/
1207                     /* This may not be quite working correctly yet . . . . */
1208                     compute_globals(fplog, gstat, cr, ir, fr, ekind, state, mdatoms, nrnb, vcm,
1209                                     wcycle, enerd, nullptr, nullptr, nullptr, nullptr, mu_tot,
1210                                     constr, &nullSignaller, state->box,
1211                                     nullptr, &bSumEkinhOld,
1212                                     CGLO_GSTAT | CGLO_TEMPERATURE);
1213                     wallcycle_start(wcycle, ewcUPDATE);
1214                 }
1215             }
1216             /* if it's the initial step, we performed this first step just to get the constraint virial */
1217             if (ir->eI == eiVV && bInitStep)
1218             {
1219                 copy_rvecn(vbuf, as_rvec_array(state->v.data()), 0, state->natoms);
1220                 sfree(vbuf);
1221             }
1222             wallcycle_stop(wcycle, ewcUPDATE);
1223         }
1224
1225         /* compute the conserved quantity */
1226         if (EI_VV(ir->eI))
1227         {
1228             saved_conserved_quantity = NPT_energy(ir, state, &MassQ);
1229             if (ir->eI == eiVV)
1230             {
1231                 last_ekin = enerd->term[F_EKIN];
1232             }
1233             if ((ir->eDispCorr != edispcEnerPres) && (ir->eDispCorr != edispcAllEnerPres))
1234             {
1235                 saved_conserved_quantity -= enerd->term[F_DISPCORR];
1236             }
1237             /* sum up the foreign energy and dhdl terms for vv.  currently done every step so that dhdl is correct in the .edr */
1238             if (ir->efep != efepNO && !bRerunMD)
1239             {
1240                 sum_dhdl(enerd, state->lambda, ir->fepvals);
1241             }
1242         }
1243
1244         /* ########  END FIRST UPDATE STEP  ############## */
1245         /* ########  If doing VV, we now have v(dt) ###### */
1246         if (bDoExpanded)
1247         {
1248             /* perform extended ensemble sampling in lambda - we don't
1249                actually move to the new state before outputting
1250                statistics, but if performing simulated tempering, we
1251                do update the velocities and the tau_t. */
1252
1253             lamnew = ExpandedEnsembleDynamics(fplog, ir, enerd, state, &MassQ, state->fep_state, state->dfhist, step, as_rvec_array(state->v.data()), mdatoms);
1254             /* history is maintained in state->dfhist, but state_global is what is sent to trajectory and log output */
1255             if (MASTER(cr))
1256             {
1257                 copy_df_history(state_global->dfhist, state->dfhist);
1258             }
1259         }
1260
1261         /* Now we have the energies and forces corresponding to the
1262          * coordinates at time t. We must output all of this before
1263          * the update.
1264          */
1265         do_md_trajectory_writing(fplog, cr, nfile, fnm, step, step_rel, t,
1266                                  ir, state, state_global, observablesHistory,
1267                                  top_global, fr,
1268                                  outf, mdebin, ekind, f,
1269                                  !bRerunMD && checkpointHandler->isCheckpointingStep(),
1270                                  bRerunMD, bLastStep,
1271                                  mdrunOptions.writeConfout,
1272                                  bSumEkinhOld);
1273         /* Check if IMD step and do IMD communication, if bIMD is TRUE. */
1274         bIMDstep = do_IMD(ir->bIMD, step, cr, bNS, state->box, as_rvec_array(state->x.data()), ir, t, wcycle);
1275
1276         /* kludge -- virial is lost with restart for MTTK NPT control. Must reload (saved earlier). */
1277         if (startingFromCheckpoint && (inputrecNptTrotter(ir) || inputrecNphTrotter(ir)))
1278         {
1279             copy_mat(state->svir_prev, shake_vir);
1280             copy_mat(state->fvir_prev, force_vir);
1281         }
1282
1283         double secondsSinceStart = walltime_accounting_get_time_since_start(walltime_accounting);
1284
1285         /* Check whether everything is still all right */
1286         if ((static_cast<int>(gmx_get_stop_condition()) > handled_stop_condition)
1287 #if GMX_THREAD_MPI
1288             && MASTER(cr)
1289 #endif
1290             )
1291         {
1292             int nsteps_stop = -1;
1293
1294             /* this just makes signals[].sig compatible with the hack
1295                of sending signals around by MPI_Reduce together with
1296                other floats */
1297             if ((gmx_get_stop_condition() == gmx_stop_cond_next_ns) ||
1298                 (mdrunOptions.reproducible &&
1299                  gmx_get_stop_condition() == gmx_stop_cond_next))
1300             {
1301                 /* We need at least two global communication steps to pass
1302                  * around the signal. We stop at a pair-list creation step
1303                  * to allow for exact continuation, when possible.
1304                  */
1305                 signals[eglsSTOPCOND].sig = 1;
1306                 nsteps_stop               = std::max(ir->nstlist, 2*nstSignalComm);
1307             }
1308             else if (gmx_get_stop_condition() == gmx_stop_cond_next)
1309             {
1310                 /* Stop directly after the next global communication step.
1311                  * This breaks exact continuation.
1312                  */
1313                 signals[eglsSTOPCOND].sig = -1;
1314                 nsteps_stop               = nstSignalComm + 1;
1315             }
1316             if (fplog)
1317             {
1318                 fprintf(fplog,
1319                         "\n\nReceived the %s signal, stopping within %d steps\n\n",
1320                         gmx_get_signal_name(), nsteps_stop);
1321                 fflush(fplog);
1322             }
1323             fprintf(stderr,
1324                     "\n\nReceived the %s signal, stopping within %d steps\n\n",
1325                     gmx_get_signal_name(), nsteps_stop);
1326             fflush(stderr);
1327             handled_stop_condition = static_cast<int>(gmx_get_stop_condition());
1328         }
1329         else if (MASTER(cr) && (bNS || ir->nstlist <= 0) &&
1330                  (mdrunOptions.maximumHoursToRun > 0 &&
1331                   secondsSinceStart > mdrunOptions.maximumHoursToRun*60.0*60.0*0.99) &&
1332                  signals[eglsSTOPCOND].sig == 0 && signals[eglsSTOPCOND].set == 0)
1333         {
1334             /* Signal to terminate the run */
1335             signals[eglsSTOPCOND].sig = 1;
1336             if (fplog)
1337             {
1338                 fprintf(fplog, "\nStep %s: Run time exceeded %.3f hours, will terminate the run\n",
1339                         gmx_step_str(step, sbuf), mdrunOptions.maximumHoursToRun*0.99);
1340             }
1341             fprintf(stderr, "\nStep %s: Run time exceeded %.3f hours, will terminate the run\n",
1342                     gmx_step_str(step, sbuf), mdrunOptions.maximumHoursToRun*0.99);
1343         }
1344
1345         resetHandler->setSignal(walltime_accounting);
1346
1347         if ((bGStat || !PAR(cr)) && !bRerunMD)
1348         {
1349             /* In parallel we only have to check for checkpointing in steps
1350              * where we do global communication,
1351              *  otherwise the other nodes don't know.
1352              */
1353             checkpointHandler->setSignal(walltime_accounting);
1354
1355         }
1356
1357         /* #########   START SECOND UPDATE STEP ################# */
1358
1359         /* at the start of the step, randomize or scale the velocities (if vv). Restriction of Andersen is controlled
1360            in preprocessing */
1361
1362         if (ETC_ANDERSEN(ir->etc)) /* keep this outside of update_tcouple because of the extra info required to pass */
1363         {
1364             gmx_bool bIfRandomize;
1365             bIfRandomize = update_randomize_velocities(ir, step, cr, mdatoms, state, upd, constr);
1366             /* if we have constraints, we have to remove the kinetic energy parallel to the bonds */
1367             if (constr && bIfRandomize)
1368             {
1369                 constrain_velocities(step, nullptr,
1370                                      state,
1371                                      tmp_vir,
1372                                      wcycle, constr,
1373                                      bCalcVir, do_log, do_ene);
1374             }
1375         }
1376         /* Box is changed in update() when we do pressure coupling,
1377          * but we should still use the old box for energy corrections and when
1378          * writing it to the energy file, so it matches the trajectory files for
1379          * the same timestep above. Make a copy in a separate array.
1380          */
1381         copy_mat(state->box, lastbox);
1382
1383         dvdl_constr = 0;
1384
1385         if (!bRerunMD || rerun_fr.bV || bForceUpdate)
1386         {
1387             wallcycle_start(wcycle, ewcUPDATE);
1388             /* UPDATE PRESSURE VARIABLES IN TROTTER FORMULATION WITH CONSTRAINTS */
1389             if (bTrotter)
1390             {
1391                 trotter_update(ir, step, ekind, enerd, state, total_vir, mdatoms, &MassQ, trotter_seq, ettTSEQ3);
1392                 /* We can only do Berendsen coupling after we have summed
1393                  * the kinetic energy or virial. Since this happens
1394                  * in global_state after update, we should only do it at
1395                  * step % nstlist = 1 with bGStatEveryStep=FALSE.
1396                  */
1397             }
1398             else
1399             {
1400                 update_tcouple(step, ir, state, ekind, &MassQ, mdatoms);
1401                 update_pcouple_before_coordinates(fplog, step, ir, state,
1402                                                   parrinellorahmanMu, M,
1403                                                   bInitStep);
1404             }
1405
1406             if (EI_VV(ir->eI))
1407             {
1408                 /* velocity half-step update */
1409                 update_coords(step, ir, mdatoms, state, f, fcd,
1410                               ekind, M, upd, etrtVELOCITY2,
1411                               cr, constr);
1412             }
1413
1414             /* Above, initialize just copies ekinh into ekin,
1415              * it doesn't copy position (for VV),
1416              * and entire integrator for MD.
1417              */
1418
1419             if (ir->eI == eiVVAK)
1420             {
1421                 /* We probably only need md->homenr, not state->natoms */
1422                 if (state->natoms > cbuf_nalloc)
1423                 {
1424                     cbuf_nalloc = state->natoms;
1425                     srenew(cbuf, cbuf_nalloc);
1426                 }
1427                 copy_rvecn(as_rvec_array(state->x.data()), cbuf, 0, state->natoms);
1428             }
1429
1430             update_coords(step, ir, mdatoms, state, f, fcd,
1431                           ekind, M, upd, etrtPOSITION, cr, constr);
1432             wallcycle_stop(wcycle, ewcUPDATE);
1433
1434             constrain_coordinates(step, &dvdl_constr, state,
1435                                   shake_vir,
1436                                   wcycle, upd, constr,
1437                                   bCalcVir, do_log, do_ene);
1438             update_sd_second_half(step, &dvdl_constr, ir, mdatoms, state,
1439                                   cr, nrnb, wcycle, upd, constr, do_log, do_ene);
1440             finish_update(ir, mdatoms,
1441                           state, graph,
1442                           nrnb, wcycle, upd, constr);
1443
1444             if (ir->eI == eiVVAK)
1445             {
1446                 /* erase F_EKIN and F_TEMP here? */
1447                 /* just compute the kinetic energy at the half step to perform a trotter step */
1448                 compute_globals(fplog, gstat, cr, ir, fr, ekind, state, mdatoms, nrnb, vcm,
1449                                 wcycle, enerd, force_vir, shake_vir, total_vir, pres, mu_tot,
1450                                 constr, &nullSignaller, lastbox,
1451                                 nullptr, &bSumEkinhOld,
1452                                 (bGStat ? CGLO_GSTAT : 0) | CGLO_TEMPERATURE
1453                                 );
1454                 wallcycle_start(wcycle, ewcUPDATE);
1455                 trotter_update(ir, step, ekind, enerd, state, total_vir, mdatoms, &MassQ, trotter_seq, ettTSEQ4);
1456                 /* now that we know the scaling, we can compute the positions again */
1457                 copy_rvecn(cbuf, as_rvec_array(state->x.data()), 0, state->natoms);
1458
1459                 update_coords(step, ir, mdatoms, state, f, fcd,
1460                               ekind, M, upd, etrtPOSITION, cr, constr);
1461                 wallcycle_stop(wcycle, ewcUPDATE);
1462
1463                 /* do we need an extra constraint here? just need to copy out of as_rvec_array(state->v.data()) to upd->xp? */
1464                 /* are the small terms in the shake_vir here due
1465                  * to numerical errors, or are they important
1466                  * physically? I'm thinking they are just errors, but not completely sure.
1467                  * For now, will call without actually constraining, constr=NULL*/
1468                 finish_update(ir, mdatoms,
1469                               state, graph,
1470                               nrnb, wcycle, upd, nullptr);
1471             }
1472             if (EI_VV(ir->eI))
1473             {
1474                 /* this factor of 2 correction is necessary
1475                    because half of the constraint force is removed
1476                    in the vv step, so we have to double it.  See
1477                    the Redmine issue #1255.  It is not yet clear
1478                    if the factor of 2 is exact, or just a very
1479                    good approximation, and this will be
1480                    investigated.  The next step is to see if this
1481                    can be done adding a dhdl contribution from the
1482                    rattle step, but this is somewhat more
1483                    complicated with the current code. Will be
1484                    investigated, hopefully for 4.6.3. However,
1485                    this current solution is much better than
1486                    having it completely wrong.
1487                  */
1488                 enerd->term[F_DVDL_CONSTR] += 2*dvdl_constr;
1489             }
1490             else
1491             {
1492                 enerd->term[F_DVDL_CONSTR] += dvdl_constr;
1493             }
1494         }
1495         else if (graph)
1496         {
1497             /* Need to unshift here */
1498             unshift_self(graph, state->box, as_rvec_array(state->x.data()));
1499         }
1500
1501         if (vsite != nullptr)
1502         {
1503             wallcycle_start(wcycle, ewcVSITECONSTR);
1504             if (graph != nullptr)
1505             {
1506                 shift_self(graph, state->box, as_rvec_array(state->x.data()));
1507             }
1508             construct_vsites(vsite, as_rvec_array(state->x.data()), ir->delta_t, as_rvec_array(state->v.data()),
1509                              top->idef.iparams, top->idef.il,
1510                              fr->ePBC, fr->bMolPBC, cr, state->box);
1511
1512             if (graph != nullptr)
1513             {
1514                 unshift_self(graph, state->box, as_rvec_array(state->x.data()));
1515             }
1516             wallcycle_stop(wcycle, ewcVSITECONSTR);
1517         }
1518
1519         /* ############## IF NOT VV, Calculate globals HERE  ############ */
1520         /* With Leap-Frog we can skip compute_globals at
1521          * non-communication steps, but we need to calculate
1522          * the kinetic energy one step before communication.
1523          */
1524         {
1525             // Organize to do inter-simulation signalling on steps if
1526             // and when algorithms require it.
1527             bool doInterSimSignal = (simulationsShareState && do_per_step(step, nstSignalComm));
1528
1529             if (bGStat || (!EI_VV(ir->eI) && do_per_step(step+1, nstglobalcomm)) || doInterSimSignal)
1530             {
1531                 // Since we're already communicating at this step, we
1532                 // can propagate intra-simulation signals. Note that
1533                 // check_nstglobalcomm has the responsibility for
1534                 // choosing the value of nstglobalcomm that is one way
1535                 // bGStat becomes true, so we can't get into a
1536                 // situation where e.g. checkpointing can't be
1537                 // signalled.
1538                 bool                doIntraSimSignal = true;
1539                 SimulationSignaller signaller(&signals, cr, ms, doInterSimSignal, doIntraSimSignal);
1540
1541                 compute_globals(fplog, gstat, cr, ir, fr, ekind, state, mdatoms, nrnb, vcm,
1542                                 wcycle, enerd, force_vir, shake_vir, total_vir, pres, mu_tot,
1543                                 constr, &signaller,
1544                                 lastbox,
1545                                 &totalNumberOfBondedInteractions, &bSumEkinhOld,
1546                                 (bGStat ? CGLO_GSTAT : 0)
1547                                 | (!EI_VV(ir->eI) || bRerunMD ? CGLO_ENERGY : 0)
1548                                 | (!EI_VV(ir->eI) && bStopCM ? CGLO_STOPCM : 0)
1549                                 | (!EI_VV(ir->eI) ? CGLO_TEMPERATURE : 0)
1550                                 | (!EI_VV(ir->eI) || bRerunMD ? CGLO_PRESSURE : 0)
1551                                 | CGLO_CONSTRAINT
1552                                 | (shouldCheckNumberOfBondedInteractions ? CGLO_CHECK_NUMBER_OF_BONDED_INTERACTIONS : 0)
1553                                 );
1554                 checkNumberOfBondedInteractions(mdlog, cr, totalNumberOfBondedInteractions,
1555                                                 top_global, top, state,
1556                                                 &shouldCheckNumberOfBondedInteractions);
1557             }
1558         }
1559
1560         /* #############  END CALC EKIN AND PRESSURE ################# */
1561
1562         /* Note: this is OK, but there are some numerical precision issues with using the convergence of
1563            the virial that should probably be addressed eventually. state->veta has better properties,
1564            but what we actually need entering the new cycle is the new shake_vir value. Ideally, we could
1565            generate the new shake_vir, but test the veta value for convergence.  This will take some thought. */
1566
1567         if (ir->efep != efepNO && (!EI_VV(ir->eI) || bRerunMD))
1568         {
1569             /* Sum up the foreign energy and dhdl terms for md and sd.
1570                Currently done every step so that dhdl is correct in the .edr */
1571             sum_dhdl(enerd, state->lambda, ir->fepvals);
1572         }
1573
1574         update_pcouple_after_coordinates(fplog, step, ir, mdatoms,
1575                                          pres, force_vir, shake_vir,
1576                                          parrinellorahmanMu,
1577                                          state, nrnb, upd);
1578
1579         /* ################# END UPDATE STEP 2 ################# */
1580         /* #### We now have r(t+dt) and v(t+dt/2)  ############# */
1581
1582         /* The coordinates (x) were unshifted in update */
1583         if (!bGStat)
1584         {
1585             /* We will not sum ekinh_old,
1586              * so signal that we still have to do it.
1587              */
1588             bSumEkinhOld = TRUE;
1589         }
1590
1591         if (bCalcEner)
1592         {
1593             /* #########  BEGIN PREPARING EDR OUTPUT  ###########  */
1594
1595             /* use the directly determined last velocity, not actually the averaged half steps */
1596             if (bTrotter && ir->eI == eiVV)
1597             {
1598                 enerd->term[F_EKIN] = last_ekin;
1599             }
1600             enerd->term[F_ETOT] = enerd->term[F_EPOT] + enerd->term[F_EKIN];
1601
1602             if (integratorHasConservedEnergyQuantity(ir))
1603             {
1604                 if (EI_VV(ir->eI))
1605                 {
1606                     enerd->term[F_ECONSERVED] = enerd->term[F_ETOT] + saved_conserved_quantity;
1607                 }
1608                 else
1609                 {
1610                     enerd->term[F_ECONSERVED] = enerd->term[F_ETOT] + NPT_energy(ir, state, &MassQ);
1611                 }
1612             }
1613             /* #########  END PREPARING EDR OUTPUT  ###########  */
1614         }
1615
1616         /* Output stuff */
1617         if (MASTER(cr))
1618         {
1619             if (fplog && do_log && bDoExpanded)
1620             {
1621                 /* only needed if doing expanded ensemble */
1622                 PrintFreeEnergyInfoToFile(fplog, ir->fepvals, ir->expandedvals, ir->bSimTemp ? ir->simtempvals : nullptr,
1623                                           state_global->dfhist, state->fep_state, ir->nstlog, step);
1624             }
1625             if (bCalcEner)
1626             {
1627                 upd_mdebin(mdebin, bDoDHDL, bCalcEnerStep,
1628                            t, mdatoms->tmass, enerd, state,
1629                            ir->fepvals, ir->expandedvals, lastbox,
1630                            shake_vir, force_vir, total_vir, pres,
1631                            ekind, mu_tot, constr);
1632             }
1633             else
1634             {
1635                 upd_mdebin_step(mdebin);
1636             }
1637
1638             gmx_bool do_dr  = do_per_step(step, ir->nstdisreout);
1639             gmx_bool do_or  = do_per_step(step, ir->nstorireout);
1640
1641             print_ebin(mdoutf_get_fp_ene(outf), do_ene, do_dr, do_or, do_log ? fplog : nullptr,
1642                        step, t,
1643                        eprNORMAL, mdebin, fcd, groups, &(ir->opts), awh.get());
1644
1645             if (ir->bPull)
1646             {
1647                 pull_print_output(ir->pull_work, step, t);
1648             }
1649
1650             if (do_per_step(step, ir->nstlog))
1651             {
1652                 if (fflush(fplog) != 0)
1653                 {
1654                     gmx_fatal(FARGS, "Cannot flush logfile - maybe you are out of disk space?");
1655                 }
1656             }
1657         }
1658         if (bDoExpanded)
1659         {
1660             /* Have to do this part _after_ outputting the logfile and the edr file */
1661             /* Gets written into the state at the beginning of next loop*/
1662             state->fep_state = lamnew;
1663         }
1664         /* Print the remaining wall clock time for the run */
1665         if (isMasterSimMasterRank(ms, cr) &&
1666             (do_verbose || gmx_got_usr_signal()) &&
1667             !bPMETunePrinting)
1668         {
1669             if (shellfc)
1670             {
1671                 fprintf(stderr, "\n");
1672             }
1673             print_time(stderr, walltime_accounting, step, ir, cr);
1674         }
1675
1676         /* Ion/water position swapping.
1677          * Not done in last step since trajectory writing happens before this call
1678          * in the MD loop and exchanges would be lost anyway. */
1679         bNeedRepartition = FALSE;
1680         if ((ir->eSwapCoords != eswapNO) && (step > 0) && !bLastStep &&
1681             do_per_step(step, ir->swap->nstswap))
1682         {
1683             bNeedRepartition = do_swapcoords(cr, step, t, ir, wcycle,
1684                                              bRerunMD ? rerun_fr.x   : as_rvec_array(state->x.data()),
1685                                              bRerunMD ? rerun_fr.box : state->box,
1686                                              MASTER(cr) && mdrunOptions.verbose,
1687                                              bRerunMD);
1688
1689             if (bNeedRepartition && DOMAINDECOMP(cr))
1690             {
1691                 dd_collect_state(cr->dd, state, state_global);
1692             }
1693         }
1694
1695         /* Replica exchange */
1696         bExchanged = FALSE;
1697         if (bDoReplEx)
1698         {
1699             bExchanged = replica_exchange(fplog, cr, ms, repl_ex,
1700                                           state_global, enerd,
1701                                           state, step, t);
1702         }
1703
1704         if ( (bExchanged || bNeedRepartition) && DOMAINDECOMP(cr) )
1705         {
1706             dd_partition_system(fplog, mdlog, step, cr, TRUE, 1,
1707                                 state_global, top_global, ir,
1708                                 state, &f, mdAtoms, top, fr,
1709                                 vsite, constr,
1710                                 nrnb, wcycle, FALSE);
1711             shouldCheckNumberOfBondedInteractions = true;
1712             update_realloc(upd, state->natoms);
1713         }
1714
1715         bFirstStep             = FALSE;
1716         bInitStep              = FALSE;
1717         startingFromCheckpoint = false;
1718
1719         /* #######  SET VARIABLES FOR NEXT ITERATION IF THEY STILL NEED IT ###### */
1720         /* With all integrators, except VV, we need to retain the pressure
1721          * at the current step for coupling at the next step.
1722          */
1723         if ((state->flags & (1<<estPRES_PREV)) &&
1724             (bGStatEveryStep ||
1725              (ir->nstpcouple > 0 && step % ir->nstpcouple == 0)))
1726         {
1727             /* Store the pressure in t_state for pressure coupling
1728              * at the next MD step.
1729              */
1730             copy_mat(pres, state->pres_prev);
1731         }
1732
1733         /* #######  END SET VARIABLES FOR NEXT ITERATION ###### */
1734
1735         if ( (membed != nullptr) && (!bLastStep) )
1736         {
1737             rescale_membed(step_rel, membed, as_rvec_array(state_global->x.data()));
1738         }
1739
1740         if (bRerunMD)
1741         {
1742             if (MASTER(cr))
1743             {
1744                 /* read next frame from input trajectory */
1745                 bLastStep = !read_next_frame(oenv, status, &rerun_fr);
1746             }
1747
1748             if (PAR(cr))
1749             {
1750                 rerun_parallel_comm(cr, &rerun_fr, &bLastStep);
1751             }
1752         }
1753
1754         cycles = wallcycle_stop(wcycle, ewcSTEP);
1755         if (DOMAINDECOMP(cr) && wcycle)
1756         {
1757             dd_cycles_add(cr->dd, cycles, ddCyclStep);
1758         }
1759
1760         if (!bRerunMD || !rerun_fr.bStep)
1761         {
1762             /* increase the MD step number */
1763             step++;
1764             step_rel++;
1765         }
1766
1767         resetHandler->resetCounters(
1768                 step, step_rel, mdlog, fplog, cr, (use_GPU(fr->nbv) ? fr->nbv : nullptr),
1769                 nrnb, fr->pmedata, pme_loadbal, wcycle, walltime_accounting);
1770
1771         /* If bIMD is TRUE, the master updates the IMD energy record and sends positions to VMD client */
1772         IMD_prep_energies_send_positions(ir->bIMD && MASTER(cr), bIMDstep, ir->imd, enerd, step, bCalcEner, wcycle);
1773
1774     }
1775     /* End of main MD loop */
1776
1777     /* Closing TNG files can include compressing data. Therefore it is good to do that
1778      * before stopping the time measurements. */
1779     mdoutf_tng_close(outf);
1780
1781     /* Stop measuring walltime */
1782     walltime_accounting_end_time(walltime_accounting);
1783
1784     if (bRerunMD && MASTER(cr))
1785     {
1786         close_trx(status);
1787     }
1788
1789     if (!thisRankHasDuty(cr, DUTY_PME))
1790     {
1791         /* Tell the PME only node to finish */
1792         gmx_pme_send_finish(cr);
1793     }
1794
1795     if (MASTER(cr))
1796     {
1797         if (ir->nstcalcenergy > 0 && !bRerunMD)
1798         {
1799             print_ebin(mdoutf_get_fp_ene(outf), FALSE, FALSE, FALSE, fplog, step, t,
1800                        eprAVER, mdebin, fcd, groups, &(ir->opts), awh.get());
1801         }
1802     }
1803     done_mdebin(mdebin);
1804     done_mdoutf(outf);
1805
1806     if (bPMETune)
1807     {
1808         pme_loadbal_done(pme_loadbal, fplog, mdlog, use_GPU(fr->nbv));
1809     }
1810
1811     done_shellfc(fplog, shellfc, step_rel);
1812
1813     if (useReplicaExchange && MASTER(cr))
1814     {
1815         print_replica_exchange_statistics(fplog, repl_ex);
1816     }
1817
1818     // Clean up swapcoords
1819     if (ir->eSwapCoords != eswapNO)
1820     {
1821         finish_swapcoords(ir->swap);
1822     }
1823
1824     /* IMD cleanup, if bIMD is TRUE. */
1825     IMD_finalize(ir->bIMD, ir->imd);
1826
1827     walltime_accounting_set_nsteps_done(walltime_accounting, step);
1828
1829     destroy_enerdata(enerd);
1830     sfree(enerd);
1831     sfree(top);
1832 }