Improve doxygen in some nblib listed forces files

[alexxy/gromacs.git] / api / nblib / listed_forces / kernels.hpp
diff --git a/api/nblib/listed_forces/kernels.hpp b/api/nblib/listed_forces/kernels.hpp

index 425820bb10dbd33ea344332451b7b4acdaff5961..e21f483c3e8b74c0316fc356a116aebd687e0f3a 100644 (file)
--- a/api/nblib/listed_forces/kernels.hpp
+++ b/api/nblib/listed_forces/kernels.hpp
@@ -47,9 +47,9 @@
  
  #include <tuple>
  
-#include "gromacs/math/vec.h"
-#include "nblib/basicdefinitions.h"
-#include "bondtypes.h"
+#include "gromacs/math/functions.h"
+#include "gromacs/math/vectypes.h"
+#include "nblib/listed_forces/bondtypes.h"
  
  namespace nblib
  {
@@ -114,7 +114,7 @@ inline std::tuple<T, T, T> harmonicScalarForce(T kA, T kB, T xA, T xB, T x, T la
  template <class T>
  inline auto bondKernel(T dr, const HarmonicBondType& bond)
  {
-    return harmonicScalarForce(bond.forceConstant(), bond.equilDistance(), dr);
+    return harmonicScalarForce(bond.forceConstant(), bond.equilConstant(), dr);
  }
  
  
@@ -133,12 +133,12 @@ inline std::tuple<T, T> g96ScalarForce(T k, T x0, T x)
      T dx  = x - x0;
      T dx2 = dx * dx;
  
-    T force = -k * dx * x;
-    T epot = 0.25 * k * dx2;
+    T force = -k * dx;
+    T epot = 0.5 * k * dx2;
  
      return std::make_tuple(force, epot);
  
-    /* That was 7 flops */
+    /* That was 6 flops */
  }
  
  /*! \brief kernel to calculate the scalar part for forth power pontential bond forces
@@ -163,8 +163,8 @@ inline std::tuple<T, T, T> g96ScalarForce(T kA, T kB, T xA, T xB, T x, T lambda)
      T dx  = x - x0;
      T dx2 = dx * dx;
  
-    T force = -kk * dx * x;
-    T epot = 0.25 * kk * dx2;
+    T force = -kk * dx;
+    T epot = 0.5 * kk * dx2;
      // TODO: Check if this is 1/2 or 1/4
      T dvdlambda = 0.5 * (kB - kA) * dx2 + (xA - xB) * kk * dx;
  
@@ -173,12 +173,14 @@ inline std::tuple<T, T, T> g96ScalarForce(T kA, T kB, T xA, T xB, T x, T lambda)
      /* That was 21 flops */
  }
  
-//! Abstraction layer for different 2-center bonds. Forth power case
+//! Abstraction layer for different 2-center bonds. Fourth power case
  template <class T>
  inline auto bondKernel(T dr, const G96BondType& bond)
  {
-    // NOTE: Not assuming GROMACS' convention of storing squared bond.equilDistance() for this type
-    return g96ScalarForce(bond.forceConstant(), bond.equilDistance() * bond.equilDistance(), dr * dr);
+    auto [force, ePot] = g96ScalarForce(bond.forceConstant(), bond.equilConstant(), dr*dr);
+    force *= dr;
+    ePot  *= 0.5;
+    return std::make_tuple(force, ePot);
  }
  
  
@@ -200,11 +202,11 @@ inline std::tuple<T, T> morseScalarForce(T k, T beta, T x0, T x)
      T kexp = k * omexp;                           /*  1 */
  
      T epot = kexp * omexp;                        /*  1 */
-    T force = -2.0 * beta * exponent * omexp;     /*  4 */
+    T force = -2.0 * beta * exponent * kexp;      /*  4 */
  
      return std::make_tuple(force, epot);
  
-    /* That was 23 flops */
+    /* That was 20 flops */
  }
  
  /*! \brief kernel to calculate the scalar part for morse potential bond forces
@@ -234,7 +236,7 @@ inline std::tuple<T, T, T> morseScalarForce(T kA, T kB, T betaA, T betaB, T xA,
      T kexp = k * omexp;                           /*  1 */
  
      T epot = kexp * omexp;                        /*  1 */
-    T force = -2.0 * beta * exponent * omexp;     /*  4 */
+    T force = -2.0 * beta * exponent * kexp;      /*  4 */
  
      T dvdlambda = (kB - kA) * omexp * omexp
                      - (2.0 - 2.0 * omexp) * omexp * k
@@ -252,6 +254,40 @@ inline auto bondKernel(T dr, const MorseBondType& bond)
      return morseScalarForce(bond.forceConstant(), bond.exponent(), bond.equilDistance(), dr);
  }
  
+/*! \brief kernel to calculate the scalar part for the 1-4 LJ non-bonded forces
+ *
+ * \param c6  C6 parameter of LJ potential
+ * \param c12 C12 parameter of LJ potential
+ * \param r   distance between the atoms
+ *
+ * \return tuple<force, potential energy>
+ */
+template <class T>
+inline std::tuple<T, T> pairLJScalarForce(C6 c6, C12 c12, T r)
+{
+    T rinv  = 1./r;                           /* 1 */
+    T rinv2 = rinv * rinv;                    /* 1 */
+    T rinv6 = rinv2 * rinv2 * rinv2;          /* 2 */
+
+    T epot  = rinv6*(c12*rinv6 - c6);         /* 3 */
+
+    T c6_     = 6.*c6;                        /* 1 */
+    T c12_    = 12.*c12;                      /* 1 */
+
+    T force = rinv6*(c12_*rinv6 - c6_)*rinv;  /* 4 */
+
+    return std::make_tuple(force, epot);
+
+    /* That was 13 flops */
+}
+
+//! Abstraction layer for different 2-center bonds. 1-4 LJ pair interactions case
+template <class T>
+inline auto bondKernel(T dr, const PairLJType& bond)
+{
+    return pairLJScalarForce(bond.c6(), bond.c12(), dr);
+}
+
  
  /*! \brief kernel to calculate the scalar part for the FENE pontential bond forces
   *         for lambda = 0
@@ -271,7 +307,7 @@ inline std::tuple<T, T> FENEScalarForce(T k, T x0, T x)
      T omx2_ox02 = 1.0 - (x2 / x02);
  
      T epot = -0.5 * k * x02 * std::log(omx2_ox02);
-    T force = -k * x / omx2_ox02;
+    T force = -k / omx2_ox02;
  
      return std::make_tuple(force, epot);
  
@@ -284,7 +320,9 @@ inline std::tuple<T, T> FENEScalarForce(T k, T x0, T x)
  template <class T>
  inline auto bondKernel(T dr, const FENEBondType& bond)
  {
-    return FENEScalarForce(bond.forceConstant(), bond.equilDistance(), dr);
+    auto [force, ePot] = FENEScalarForce(bond.forceConstant(), bond.equilConstant(), dr);
+    force *= dr;
+    return std::make_tuple(force, ePot);
  }
  
  
@@ -302,6 +340,7 @@ template <class T>
  inline std::tuple<T, T> cubicScalarForce(T kc, T kq, T x0, T x)
  {
      T dx = x - x0;
+    //T dx2 = dx * dx;
  
      T kdist  = kq * dx;
      T kdist2 = kdist * dx;
@@ -384,37 +423,193 @@ inline std::tuple<T, T, T> halfAttractiveScalarForce(T kA, T kB, T xA, T xB, T x
  template <class T>
  inline auto bondKernel(T dr, const HalfAttractiveQuarticBondType& bond)
  {
-    return halfAttractiveScalarForce(bond.forceConstant(), bond.equilDistance(), dr);
+    return halfAttractiveScalarForce(bond.forceConstant(), bond.equilConstant(), dr);
  }
  
  
  //! Three-center interaction type kernels
  
-// linear angles go here
-// quartic angles go here
+/*! \brief kernel to calculate the scalar part for linear angle forces
+ *         for lambda = 0
+ *
+ * \param k force constant
+ * \param a0 equilibrium angle
+ * \param angle current angle vaule
+ *
+ * \return tuple<force, potential energy>
+ */
+template <class T>
+inline std::tuple<T, T, T> linearAnglesScalarForce(T k, T a0, T angle)
+{
+    T b = T(1.0) - a0;
+
+    T kdr  = k * angle;
+    T epot = 0.5 * kdr * angle;
+
+    T ci = a0 * k;
+    T ck = b * k;
+
+    return std::make_tuple(ci, ck, epot);
+
+    /* That was 5 flops */
+}
+
+template <class T>
+inline auto threeCenterKernel(T dr, const LinearAngle& angle)
+{
+    return linearAnglesScalarForce(angle.forceConstant(), angle.equilConstant(), dr);
+}
+
+//! Harmonic Angle
+template <class T>
+inline auto threeCenterKernel(T dr, const HarmonicAngle& angle)
+{
+    return harmonicScalarForce(angle.forceConstant(), angle.equilConstant(), dr);
+}
+
+//! Cosine based (GROMOS-96) Angle
+template <class T>
+inline auto threeCenterKernel(T dr, const G96Angle& angle)
+{
+    auto costheta = std::cos(dr);
+    auto feTuple = g96ScalarForce(angle.forceConstant(), angle.equilConstant(), costheta);
+
+    // The above kernel call effectively computes the derivative of the potential with respect to
+    // cos(theta). However, we need the derivative with respect to theta. We use this extra -sin(theta)
+    // factor to account for this before the forces are spread between the particles.
+
+    std::get<0>(feTuple) *= -std::sqrt(1 - costheta*costheta);
+    return feTuple;
+}
+
+/*! \brief kernel to calculate the scalar part for cross bond-bond forces
+ *         for lambda = 0
+ *
+ * \param k force constant
+ * \param r0ij equilibrium distance between particles i & j
+ * \param r0kj equilibrium distance between particles k & j
+ * \param rij  input bond length between particles i & j
+ * \param rkj  input bond length between particles k & j
+ *
+ * \return tuple<force scalar i, force scalar k, potential energy>
+ */
+
+template <class T>
+inline std::tuple<T, T, T> crossBondBondScalarForce(T k, T r0ij, T r0kj, T rij, T rkj)
+{
+    T si = rij - r0ij;
+    T sk = rkj - r0kj;
+
+    T epot = k * si * sk;
+
+    T ci = -k * sk / rij;
+    T ck = -k * si / rkj;
+
+    return std::make_tuple(ci, ck, epot);
+
+    /* That was 8 flops */
+}
+
+//! Cross bond-bond interaction
+template <class T>
+inline auto threeCenterKernel(T drij, T drkj, const CrossBondBond& crossBondBond)
+{
+    return crossBondBondScalarForce(crossBondBond.forceConstant(), crossBondBond.equilDistanceIJ(), crossBondBond.equilDistanceKJ(), drij, drkj);
+}
+
+/*! \brief kernel to calculate the scalar part for cross bond-angle forces
+ *         for lambda = 0
+ *
+ * \param k force constant
+ * \param r0ij equilibrium distance between particles i & j
+ * \param r0kj equilibrium distance between particles k & j
+ * \param r0ik equilibrium distance between particles i & k
+ * \param rij  input bond length between particles i & j
+ * \param rkj  input bond length between particles k & j
+ * \param rik  input bond length between particles i & k
+ *
+ * \return tuple<atom i force, atom j force, atom k force, potential energy>
+ */
  
-//! Three-center interaction type dispatch
+template <class T>
+inline std::tuple<T, T, T, T> crossBondAngleScalarForce(T k, T r0ij, T r0kj, T r0ik, T rij, T rkj, T rik)
+{
+    T sij = rij - r0ij;
+    T skj = rkj - r0kj;
+    T sik = rik - r0ik;
+
+    T epot = k * sik * (sij + skj);
+
+    T fi = -k * sik / rij;
+    T fj = -k * sik / rkj;
+    T fk = -k * (sij + skj) / rik;
+
+    return std::make_tuple(fi, fj, fk, epot);
+
+    /* That was 13 flops */
+}
+
+//! Cross bond-bond interaction
+template <class T>
+inline auto threeCenterKernel(T drij, T drkj, T drik, const CrossBondAngle& crossBondAngle)
+{
+    return crossBondAngleScalarForce(crossBondAngle.forceConstant(), crossBondAngle.equilDistanceIJ(), crossBondAngle.equilDistanceKJ(), crossBondAngle.equilDistanceIK(), drij, drkj, drik);
+}
  
+//! Quartic Angle
  template <class T>
-inline auto threeCenterKernel(T dr, const DefaultAngle& angle)
+inline auto threeCenterKernel(T dr, const QuarticAngle& angle)
  {
-    return harmonicScalarForce(angle.forceConstant(), angle.equilDistance(), dr);
+    T dt = dr - angle.equilConstant();       /*  1          */
+
+    T force  = 0;
+    T energy = angle.forceConstant(0);
+    T dtp  = 1.0;
+    for (auto j = 1; j <= 4; j++)
+    { /* 24     */
+        T c = angle.forceConstant(j);
+        force -= j * c * dtp;               /*  3          */
+        dtp *= dt;                          /*  1          */
+        energy += c * dtp;                  /*  2          */
+    }
+
+    /* TOTAL 25 */
+    return std::make_tuple(force, energy);
  }
  
+//! \brief Restricted Angle potential. Returns scalar force and energy
+template <class T>
+inline auto threeCenterKernel(T theta, const RestrictedAngle& angle)
+{
+    T costheta = std::cos(theta);
+    auto [force, ePot] = harmonicScalarForce(angle.forceConstant(), angle.equilConstant(), costheta);
+
+    // The above kernel call effectively computes the derivative of the potential with respect to
+    // cos(theta). However, we need the derivative with respect to theta.
+    // This introduces the extra (cos(theta)*cos(eqAngle) - 1)/(sin(theta)^3 factor for the force
+    // The call also computes the potential energy without the sin(theta)^-2 factor
+
+    T sintheta2 = (1 - costheta*costheta);
+    T sintheta  = std::sqrt(sintheta2);
+    force *= (costheta*angle.equilConstant() - 1)/(sintheta2*sintheta);
+    ePot /= sintheta2;
+    return std::make_tuple(force, ePot);
+}
  
  //! \brief Computes and returns the proper dihedral force
  template <class T>
  inline auto fourCenterKernel(T phi, const ProperDihedral& properDihedral)
  {
-    const T deltaPhi = properDihedral.multiplicity() * phi - properDihedral.equilDistance();
-    const T force = -properDihedral.forceConstant() * properDihedral.multiplicity() * std::sin(deltaPhi);
-    const T ePot = properDihedral.forceConstant() * ( 1 + std::cos(deltaPhi) );
+    T deltaPhi = properDihedral.multiplicity() * phi - properDihedral.equilDistance();
+    T force = -properDihedral.forceConstant() * properDihedral.multiplicity() * std::sin(deltaPhi);
+    T ePot = properDihedral.forceConstant() * ( 1 + std::cos(deltaPhi) );
      return std::make_tuple(force, ePot);
  }
  
  
  //! \brief Ensure that a geometric quantity lies in (-pi, pi)
-static inline void makeAnglePeriodic(real& angle)
+template<class T>
+inline void makeAnglePeriodic(T& angle)
  {
      if (angle >= M_PI)
      {
@@ -426,15 +621,79 @@ static inline void makeAnglePeriodic(real& angle)
      }
  }
  
-//! \brief Computes and returns a dihedral phi angle
-static inline real dihedralPhi(rvec dxIJ, rvec dxKJ, rvec dxKL, rvec m, rvec n)
+/*! \brief calculate the cosine of the angle between aInput and bInput
+ *
+ * \tparam T       float or double
+ * \param aInput   aInput 3D vector
+ * \param bInput   another 3D vector
+ * \return         the cosine of the angle between aInput and bInput
+ *
+ *                       ax*bx + ay*by + az*bz
+ * cos(aInput,bInput) = -----------------------, where aInput = (ax, ay, az)
+ *                      ||aInput|| * ||bInput||
+ */
+template<class T>
+inline T basicVectorCosAngle(gmx::BasicVector<T> aInput, gmx::BasicVector<T> bInput)
  {
-    cprod(dxIJ, dxKJ, m);
-    cprod(dxKJ, dxKL, n);
-    real phi  = gmx_angle(m, n);
-    real ipr  = iprod(dxIJ, n);
-    real sign = (ipr < 0.0) ? -1.0 : 1.0;
-    phi       = sign * phi;
+    gmx::BasicVector<double> a_double(aInput[0], aInput[1], aInput[2]);
+    gmx::BasicVector<double> b_double(bInput[0], bInput[1], bInput[2]);
+
+    double numerator     = dot(a_double, b_double);
+    double denominatorSq = dot(a_double, a_double) * dot(b_double, b_double);
+
+    T cosval = (denominatorSq > 0) ? static_cast<T>(numerator * gmx::invsqrt(denominatorSq)) : 1;
+    cosval   = std::min(cosval, T(1.0));
+
+    /* 25 TOTAL */
+    return std::max(cosval, T(-1.0));
+}
+
+/*! \brief compute the angle between vectors a and b
+ *
+ * \tparam T    scalar type (float, double, or similar)
+ * \param a     a 3D vector
+ * \param b     another 3D vector
+ * \return      the angle between a and b
+ *
+ * This routine calculates the angle between a & b without any loss of accuracy close to 0/PI.
+ *
+ * Note: This function is not (yet) implemented for the C++ replacement of the
+ * deprecated rvec and dvec.
+ */
+template<class T>
+inline T basicVectorAngle(gmx::BasicVector<T> a, gmx::BasicVector<T> b)
+{
+    gmx::BasicVector<T> w = cross(a, b);
+
+    T wlen = norm(w);
+    T s    = dot(a, b);
+
+    return std::atan2(wlen, s);
+}
+
+/*! \brief Computes the dihedral phi angle and two cross products
+ *
+ * \tparam T        scalar type (float or double, or similar)
+ * \param[in] dxIJ
+ * \param[in] dxKJ
+ * \param[in] dxKL
+ * \param[out] m    output for \p dxIJ x \p dxKJ
+ * \param[out] n    output for \p dxKJ x \p dxKL
+ * \return          the angle between m and n
+ */
+template<class T>
+inline T dihedralPhi(gmx::BasicVector<T> dxIJ,
+                     gmx::BasicVector<T> dxKJ,
+                     gmx::BasicVector<T> dxKL,
+                     gmx::BasicVector<T>* m,
+                     gmx::BasicVector<T>* n)
+{
+    *m = cross(dxIJ, dxKJ);
+    *n = cross(dxKJ, dxKL);
+    T phi  = basicVectorAngle(*m, *n);
+    T ipr  = dot(dxIJ, *n);
+    T sign = (ipr < 0.0) ? -1.0 : 1.0;
+    phi    = sign * phi;
      return phi;
  }
  
@@ -442,7 +701,7 @@ static inline real dihedralPhi(rvec dxIJ, rvec dxKJ, rvec dxKL, rvec m, rvec n)
  template <class T>
  inline auto fourCenterKernel(T phi, const ImproperDihedral& improperDihedral)
  {
-    T deltaPhi = phi - improperDihedral.equilDistance();
+    T deltaPhi = phi - improperDihedral.equilConstant();
      /* deltaPhi cannot be outside (-pi,pi) */
      makeAnglePeriodic(deltaPhi);
      const T force = -improperDihedral.forceConstant()  * deltaPhi;
@@ -474,114 +733,172 @@ inline auto fourCenterKernel(T phi, const RyckaertBellemanDihedral& ryckaertBell
  
  //! Two-center category common
  
-/*! \brief Spreads and accumulates the bonded forces to the two atoms and adds the virial contribution when needed
+//! \brief add shift forces, if requested (static compiler decision)
+template<class T, class ShiftForce>
+inline void
+addShiftForce(const gmx::BasicVector<T>& interactionForce, ShiftForce* shiftForce)
+{
+    *shiftForce += interactionForce;
+}
+
+//! \brief this will be called if shift forces are not computed (and removed by the compiler)
+template<class T>
+inline void addShiftForce([[maybe_unused]] const gmx::BasicVector<T>& fij,
+                          [[maybe_unused]] std::nullptr_t*)
+{
+}
+
+/*! \brief Spreads and accumulates the forces between two atoms and adds the virial contribution when needed
   *
- * \p shiftIndex is used as the periodic shift.
+ * \tparam T         The type of vector, e.g. float, double, etc
+ * \param force      The Force
+ * \param dx         Distance between centers
+ * \param force_i    Force on center i
+ * \param force_j    Force on center j
+ * \param shf_ik     Shift force between centers i and j
+ * \param shf_c      Shift force at the "center" of the two center interaction
   */
-template <class T>
-inline void spreadTwoCenterForces(const T bondForce,
-                                  const gmx::RVec& dx,
-                                  gmx::RVec* force_i,
-                                  gmx::RVec* force_j)
+template <class T, class ShiftForce>
+inline void spreadTwoCenterForces(const T force,
+                                  const gmx::BasicVector<T>& dx,
+                                  gmx::BasicVector<T>*       force_i,
+                                  gmx::BasicVector<T>*       force_j,
+                                  ShiftForce*                shf_ij,
+                                  ShiftForce*                shf_c)
  {
-    for (int m = 0; m < dimSize; m++) /*  15          */
-    {
-        const T fij = bondForce * dx[m];
-        (*force_i)[m] += fij;
-        (*force_j)[m] -= fij;
-    }
+    gmx::BasicVector<T> fij = force * dx;
+    *force_i += fij;
+    *force_j -= fij;
+
+    addShiftForce(fij, shf_ij);
+    addShiftForce(T(-1.0)*fij, shf_c);
+    /* 15 Total */
  }
  
  //! Three-center category common
  
  /*! \brief spread force to 3 centers based on scalar force and angle
   *
- * @tparam T
- * @param cos_theta
- * @param force
- * @param r_ij
- * @param r_kj
- * @param force_i
- * @param force_j
- * @param force_k
+ * \tparam T         The type of vector, e.g. float, double, etc
+ * \param cos_theta  Angle between two vectors
+ * \param force      The Force
+ * \param dxIJ       Distance between centers i and j
+ * \param dxJK       Distance between centers j and k
+ * \param force_i    Force on center i
+ * \param force_j    Force on center j
+ * \param force_k    Force on center k
+ * \param shf_ik     Shift force between centers i and j
+ * \param shf_kj     Shift force between centers k and j
+ * \param shf_c      Shift force at the center subtending the angle
   */
-template <class T>
-inline void spreadThreeCenterForces(T cos_theta,
-                             T force,
-                             const gmx::RVec& r_ij,
-                             const gmx::RVec& r_kj,
-                             gmx::RVec* force_i,
-                             gmx::RVec* force_j,
-                             gmx::RVec* force_k)
+template <class T, class ShiftForce>
+inline void spreadThreeCenterForces(T                          cos_theta,
+                                    T                          force,
+                                    const gmx::BasicVector<T>& dxIJ,
+                                    const gmx::BasicVector<T>& dxKJ,
+                                    gmx::BasicVector<T>*       force_i,
+                                    gmx::BasicVector<T>*       force_j,
+                                    gmx::BasicVector<T>*       force_k,
+                                    ShiftForce*                shf_ij,
+                                    ShiftForce*                shf_kj,
+                                    ShiftForce*                shf_c)
  {
      T cos_theta2 = cos_theta * cos_theta;
-    if (cos_theta2 < 1)
+    if (cos_theta2 < 1)                              /*   1            */
      {
          T st    = force / std::sqrt(1 - cos_theta2); /*  12            */
-        T sth   = st * cos_theta;                      /*   1          */
-        T nrij2 = dot(r_ij, r_ij);                   /*   5            */
-        T nrkj2 = dot(r_kj, r_kj);                   /*   5            */
-
-        T nrij_1 = 1.0 / std::sqrt(nrij2); /*  10              */
-        T nrkj_1 = 1.0 / std::sqrt(nrkj2); /*  10              */
-
-        T cik = st * nrij_1 * nrkj_1;  /*   2          */
-        T cii = sth * nrij_1 * nrij_1; /*   2          */
-        T ckk = sth * nrkj_1 * nrkj_1; /*   2          */
-
-        gmx::RVec f_i{0, 0, 0};
-        gmx::RVec f_j{0, 0, 0};
-        gmx::RVec f_k{0, 0, 0};
-        for (int m = 0; m < dimSize; m++)
-        { /*  39               */
-            f_i[m] = -(cik * r_kj[m] - cii * r_ij[m]);
-            f_k[m] = -(cik * r_ij[m] - ckk * r_kj[m]);
-            f_j[m] = -f_i[m] - f_k[m];
-            (*force_i)[m] += f_i[m];
-            (*force_j)[m] += f_j[m];
-            (*force_k)[m] += f_k[m];
-        }
-    } /* 161 TOTAL     */
+        T sth   = st * cos_theta;                    /*   1            */
+        T nrij2 = dot(dxIJ, dxIJ);                   /*   5            */
+        T nrkj2 = dot(dxKJ, dxKJ);                   /*   5            */
+
+        T cik = st / std::sqrt(nrij2 * nrkj2);       /*  11            */
+        T cii = sth / nrij2;                         /*   1            */
+        T ckk = sth / nrkj2;                         /*   1            */
+
+        /*  33 */
+        gmx::BasicVector<T> f_i = cii * dxIJ - cik * dxKJ;
+        gmx::BasicVector<T> f_k = ckk * dxKJ - cik * dxIJ;
+        gmx::BasicVector<T> f_j = T(-1.0) * (f_i + f_k);
+        *force_i += f_i;
+        *force_j += f_j;
+        *force_k += f_k;
+
+        addShiftForce(f_i, shf_ij);
+        addShiftForce(f_j, shf_c);
+        addShiftForce(f_k, shf_kj);
+
+    } /* 70 TOTAL      */
  }
  
  //! Four-center category common
-template <class T>
-inline void spreadFourCenterForces(T force, rvec dxIJ, rvec dxJK, rvec dxKL, rvec m, rvec n,
-                            gmx::RVec* force_i,
-                            gmx::RVec* force_j,
-                            gmx::RVec* force_k,
-                            gmx::RVec* force_l)
-{
-    rvec f_i, f_j, f_k, f_l;
-    rvec uvec, vvec, svec;
-    T iprm  = iprod(m, m);       /*  5    */
-    T iprn  = iprod(n, n);       /*  5 */
-    T nrkj2 = iprod(dxJK, dxJK); /*  5 */
-    T toler = nrkj2 * GMX_REAL_EPS;
-    if ((iprm > toler) && (iprn > toler))
+
+/*! \brief spread force to 4 centers
+ *
+ * \tparam T         The type of vector, e.g. float, double, etc
+ * \param dxIJ       Distance between centers i and j
+ * \param dxKJ       Distance between centers j and k
+ * \param dxKL       Distance between centers k and l
+ * \param m          Cross product of \p dxIJ x \p dxKJ
+ * \param m          Cross product of \p dxKJ x \p dxKL
+ * \param force_i    Force on center i
+ * \param force_j    Force on center j
+ * \param force_k    Force on center k
+ * \param force_k    Force on center l
+ * \param shf_ik     Shift force between centers i and j
+ * \param shf_kj     Shift force between centers k and j
+ * \param shf_lj     Shift force between centers k and j
+ * \param shf_c      Shift force at the center subtending the angle
+ */
+template <class T, class ShiftForce>
+inline void spreadFourCenterForces(T force,
+                                   const gmx::BasicVector<T>& dxIJ,
+                                   const gmx::BasicVector<T>& dxJK,
+                                   const gmx::BasicVector<T>& dxKL,
+                                   const gmx::BasicVector<T>& m,
+                                   const gmx::BasicVector<T>& n,
+                                   gmx::BasicVector<T>* force_i,
+                                   gmx::BasicVector<T>* force_j,
+                                   gmx::BasicVector<T>* force_k,
+                                   gmx::BasicVector<T>* force_l,
+                                   ShiftForce* shf_ij,
+                                   ShiftForce* shf_kj,
+                                   ShiftForce* shf_lj,
+                                   ShiftForce* shf_c)
+{
+    T norm2_m = dot(m, m);                             /* 5 */
+    T norm2_n = dot(n, n);                             /* 5 */
+    T norm2_jk = dot(dxJK, dxJK);                      /* 5 */
+    T toler = norm2_jk * GMX_REAL_EPS;
+    if ((norm2_m > toler) && (norm2_n > toler))
      {
-        T nrkj_1 = gmx::invsqrt(nrkj2);  /* 10 */
-        T nrkj_2 = nrkj_1 * nrkj_1;      /*  1 */
-        T nrkj   = nrkj2 * nrkj_1;       /*  1 */
-        T a      = -force * nrkj / iprm; /* 11 */
-        svmul(a, m, f_i);              /*  3   */
-        T b = force * nrkj / iprn;       /* 11 */
-        svmul(b, n, f_l);              /*  3  */
-        T p = iprod(dxIJ, dxJK);         /*  5 */
-        p *= nrkj_2;                   /*  1   */
-        T q = iprod(dxKL, dxJK);         /*  5 */
-        q *= nrkj_2;                   /*  1   */
-        svmul(p, f_i, uvec);           /*  3   */
-        svmul(q, f_l, vvec);           /*  3   */
-        rvec_sub(uvec, vvec, svec);    /*  3   */
-        rvec_sub(f_i, svec, f_j);      /*  3   */
-        rvec_add(f_l, svec, f_k);      /*  3   */
-        rvec_inc(force_i->as_vec(), f_i);           /*  3      */
-        rvec_dec(force_j->as_vec(), f_j);           /*  3      */
-        rvec_dec(force_k->as_vec(), f_k);           /*  3      */
-        rvec_inc(force_l->as_vec(), f_l);           /*  3      */
+        T rcp_norm2_jk = 1.0f / norm2_jk;              /* 1 */
+        T norm_jk = std::sqrt(norm2_jk);               /* 10 */
+
+        T a = -force * norm_jk / norm2_m;              /* 11 */
+        gmx::BasicVector<T> f_i = a * m;               /* 3 */
+
+        T b = force * norm_jk / norm2_n;               /* 11 */
+        gmx::BasicVector<T> f_l = b * n;               /* 3 */
+
+        T p = rcp_norm2_jk * dot(dxIJ, dxJK);          /* 6 */
+        T q = rcp_norm2_jk * dot(dxKL, dxJK);          /* 6 */
+        gmx::BasicVector<T> svec = p * f_i - q * f_l;  /* 9 */
+
+        gmx::BasicVector<T> f_j = svec - f_i;          /* 3 */
+        gmx::BasicVector<T> f_k = T(-1.0)*svec - f_l;  /* 6 */
+
+        *force_i += f_i;                               /* 3 */
+        *force_j += f_j;                               /* 3 */
+        *force_k += f_k;                               /* 3 */
+        *force_l += f_l;                               /* 3 */
+
+        addShiftForce(f_i, shf_ij);
+        addShiftForce(f_j, shf_c);
+        addShiftForce(f_k, shf_kj);
+        addShiftForce(f_l, shf_lj);
      }
  }
  
  } // namespace nblib
+
  #endif // NBLIB_LISTEDFORCES_KERNELS_HPP