/* Linearly interpolates a tabulated value at position r.
 *
 * r is multiplied by scale to obtain a fractional table coordinate; the two
 * neighbouring entries (index and index + 1) are fetched from
 * coulomb_tab_texref with tex1Dfetch and blended with weights that sum to 1.
 *
 * r     - input value to look up (presumably a distance -- confirm with caller)
 * scale - factor converting r into table-index units
 *
 * Returns fract1 * table[index] + fract2 * table[index + 1].
 *
 * NOTE(review): no bounds check is done here; index + 1 is assumed to be a
 * valid table entry -- TODO confirm the caller guarantees this.
 * NOTE(review): lines prefixed with '-' / '+' are unified-diff markers; each
 * removed line has a textually identical added counterpart in this view, so
 * the change appears to be whitespace-only.
 */
float interpolate_coulomb_force_r(float r, float scale)
{
float normalized = scale * r;
/* The (int) cast truncates toward zero, so fract2 is the fractional part of
 * normalized (for non-negative input) and fract1 is its complement. */
- int index = (int) normalized;
- float fract2 = normalized - index;
- float fract1 = 1.0f - fract2;
+ int index = (int) normalized;
+ float fract2 = normalized - index;
+ float fract1 = 1.0f - fract2;
/* Weighted sum of the two adjacent table entries. */
- return fract1 * tex1Dfetch(coulomb_tab_texref, index)
- + fract2 * tex1Dfetch(coulomb_tab_texref, index + 1);
+ return fract1 * tex1Dfetch(coulomb_tab_texref, index)
+ + fract2 * tex1Dfetch(coulomb_tab_texref, index + 1);
}
#ifdef TEXOBJ_SUPPORTED
float r, float scale)
{
float normalized = scale * r;
- int index = (int) normalized;
- float fract2 = normalized - index;
- float fract1 = 1.0f - fract2;
+ int index = (int) normalized;
+ float fract2 = normalized - index;
+ float fract1 = 1.0f - fract2;
- return fract1 * tex1Dfetch<float>(texobj_coulomb_tab, index) +
- fract2 * tex1Dfetch<float>(texobj_coulomb_tab, index + 1);
+ return fract1 * tex1Dfetch<float>(texobj_coulomb_tab, index) +
+ fract2 * tex1Dfetch<float>(texobj_coulomb_tab, index + 1);
}
#endif
const float FD0 = 1.0f;
float z4;
- float polyFN0,polyFN1,polyFD0,polyFD1;
+ float polyFN0, polyFN1, polyFD0, polyFD1;
z4 = z2*z2;
#pragma unroll 5
for (i = 0; i < 5; i++)
{
- E_lj += __shfl_down(E_lj,sh);
- E_el += __shfl_down(E_el,sh);
- sh += sh;
+ E_lj += __shfl_down(E_lj, sh);
+ E_el += __shfl_down(E_el, sh);
+ sh += sh;
}
/* Threads with tidx == 0 or tidx == WARP_SIZE (presumably the first lane of
 * each of two warps -- confirm block size) write the reduced energies */
if (tidx == 0 || tidx == WARP_SIZE)
{
- atomicAdd(e_lj,E_lj);
- atomicAdd(e_el,E_el);
+ atomicAdd(e_lj, E_lj);
+ atomicAdd(e_el, E_el);
}
}
#endif /* __CUDA_ARCH__ */