namd/doxygen/ComputeBondedCUDAKernel_8h_source.html

 #ifndef COMPUTEBONDEDCUDAKERNEL_H
 #define COMPUTEBONDEDCUDAKERNEL_H
 #include "CudaUtils.h"
 #include "TupleTypesCUDA.h"
 #include "CudaNonbondedTables.h"

 #if defined(NAMD_CUDA) || defined(NAMD_HIP)

 // Element type of the force buffers declared in ComputeBondedCUDAKernel
 // (the forceList and forces members).
 #define FORCE_TYPE double

 // Force-layout switch. This is the only supported setting: the check right
 // below turns a build without it into a compile-time error.
 #define USE_STRIDED_FORCE

 #ifndef USE_STRIDED_FORCE
 #error "Non-USE_STRIDED_FORCE not implemented"
 #endif

 // Makes ComputeBondedCUDAKernel::BondedVirial carry all nine tensor
 // components (xx..zz); the alternative branch in that struct is an #error.
 #define WRITE_FULL_VIRIALS

 // NOTE(review): not referenced anywhere in this header; presumably consumed
 // by the kernel implementation to choose how forces are stored -- confirm.
 #define USE_BONDED_FORCE_ATOMIC_STORE

 // Declares the object that owns the buffers and entry points for the bonded
 // terms (bonds, angles, dihedrals, impropers, exclusions, crossterms).
 // Only declarations are visible in this header; notes on the out-of-line
 // methods below are derived from their signatures and are marked where they
 // are assumptions to be confirmed against the implementation.
 class ComputeBondedCUDAKernel {
 public:

   // Enumeration for energies_virials[]
   // Enumerators are consecutive starting at energyIndex_BOND=0, so
   // energies_virials_SIZE (last entry) equals the number of slots:
   // 8 plain energy terms, 8x3 alchemical entries (_F, _TI_1, _TI_2 per term),
   // and four 3x3 virial blocks (normal, nbond, slow, amdDihe).
   // Inserting or reordering an enumerator shifts every index after it.
   enum {energyIndex_BOND=0, energyIndex_ANGLE, energyIndex_DIHEDRAL, energyIndex_IMPROPER,
     energyIndex_ELECT, energyIndex_LJ, energyIndex_ELECT_SLOW, energyIndex_CROSSTERM,
     energyIndex_BOND_F, energyIndex_BOND_TI_1, energyIndex_BOND_TI_2, // Alchemical, bond energy
     energyIndex_ANGLE_F, energyIndex_ANGLE_TI_1, energyIndex_ANGLE_TI_2, // Alchemical, angle energy
     energyIndex_DIHEDRAL_F, energyIndex_DIHEDRAL_TI_1, energyIndex_DIHEDRAL_TI_2, // Alchemical, dihedral energy
     energyIndex_IMPROPER_F, energyIndex_IMPROPER_TI_1, energyIndex_IMPROPER_TI_2, // Alchemical, improper energy
     energyIndex_ELECT_F, energyIndex_ELECT_TI_1, energyIndex_ELECT_TI_2,
     energyIndex_LJ_F, energyIndex_LJ_TI_1, energyIndex_LJ_TI_2,
     energyIndex_ELECT_SLOW_F, energyIndex_ELECT_SLOW_TI_1, energyIndex_ELECT_SLOW_TI_2,
     energyIndex_CROSSTERM_F, energyIndex_CROSSTERM_TI_1, energyIndex_CROSSTERM_TI_2, // Alchemical, cross-term energy
     normalVirialIndex_XX, normalVirialIndex_XY, normalVirialIndex_XZ,
     normalVirialIndex_YX, normalVirialIndex_YY, normalVirialIndex_YZ,
     normalVirialIndex_ZX, normalVirialIndex_ZY, normalVirialIndex_ZZ,
     nbondVirialIndex_XX, nbondVirialIndex_XY, nbondVirialIndex_XZ,
     nbondVirialIndex_YX, nbondVirialIndex_YY, nbondVirialIndex_YZ,
     nbondVirialIndex_ZX, nbondVirialIndex_ZY, nbondVirialIndex_ZZ,
     slowVirialIndex_XX, slowVirialIndex_XY, slowVirialIndex_XZ,
     slowVirialIndex_YX, slowVirialIndex_YY, slowVirialIndex_YZ,
     slowVirialIndex_ZX, slowVirialIndex_ZY, slowVirialIndex_ZZ,
     amdDiheVirialIndex_XX, amdDiheVirialIndex_XY, amdDiheVirialIndex_XZ,
     amdDiheVirialIndex_YX, amdDiheVirialIndex_YY, amdDiheVirialIndex_YZ,
     amdDiheVirialIndex_ZX, amdDiheVirialIndex_ZY, amdDiheVirialIndex_ZZ,
     energies_virials_SIZE};

   // Virial tensor with element type T. With WRITE_FULL_VIRIALS defined (the
   // only implemented configuration) it holds nine components declared in the
   // order xx, xy, xz, yx, yy, yz, zx, zy, zz.
   template <typename T>
   struct BondedVirial {
 #ifdef WRITE_FULL_VIRIALS
     T xx;
     T xy;
     T xz;
     T yx;
     T yy;
     T yz;
     T zx;
     T zy;
     T zz;
 #else
     // Unreachable in a successful build: the #error below stops compilation
     // before this alternative layout can be used.
 #error "non-WRITE_FULL_VIRIALS not implemented yet"
     union {
       double sforce_dp[27][3];
       long long int sforce_fp[27][3];
     };
 #endif
   };
   // Returns the raw `forces` pointer (declared below as FORCE_TYPE*, which is
   // double with the current FORCE_TYPE). The member is commented as device
   // memory, so the result is not meant to be dereferenced on the host.
   double *getForces(){
     return forces;
   }
 private:
   // Both members are named identically to the constructor parameters;
   // presumably they are bound there -- confirm in the implementation.
   const int deviceID;
   CudaNonbondedTables& cudaNonbondedTables;

   // This stores all bonds, angles, dihedrals, and impropers in a single
   // contiguous memory array.
   char* tupleData;
   size_t tupleDataSize;

   // ---------------------------------------------------------------------------------
   // NOTE: bonds, angles, dihedrals, impropers, etc. - pointers below are
   // computed pointers pointing to tupleData -array
   // DO NOT DEALLOCATE THESE!
   int numBonds;
   CudaBond* bonds;

   int numAngles;
   CudaAngle* angles;

   int numDihedrals;
   CudaDihedral* dihedrals;

   // Impropers reuse the CudaDihedral tuple type.
   int numImpropers;
   CudaDihedral* impropers;

   int numModifiedExclusions;
   CudaExclusion* modifiedExclusions;

   int numExclusions;
   CudaExclusion* exclusions;

   int numCrossterms;
   CudaCrossterm* crossterms;
   // ---------------------------------------------------------------------------------

   // Device memory for coordinates
   // (exposed read/write to callers through getAtomBuffer()).
   float4* xyzq;
   size_t xyzqSize;

   // Force-list buffers and their sizes. How they are filled and consumed is
   // not visible in this header.
   // NOTE(review): units of the *Size fields (elements vs. bytes) -- confirm.
   FORCE_TYPE* forceList;
   int* forceListCounter;
   int* forceListStarts;
   int* forceListNexts;
   int forceListSize;
   int forceListStartsSize;
   int forceListNextsSize;

   // Device memory for forces:
   // [normal, nbond, slow]
   FORCE_TYPE* forces;
   size_t forcesSize;

   // Per-type parameter tables; presumably populated by the matching
   // setup*Values() methods below -- confirm in the implementation.
   // Impropers reuse the CudaDihedralValue type.
   CudaBondValue* bondValues;
   CudaAngleValue* angleValues;
   CudaDihedralValue* dihedralValues;
   CudaDihedralValue* improperValues;
   CudaCrosstermValue* crosstermValues;

   // Accumulated energy values for every bonded type
   // (indexed by the anonymous enum at the top of this class).
   double* energies_virials;

   // Alchemical flags
   CudaAlchFlags       alchFlags;

 public:

   // Construction/destruction are defined out of line. The class holds a
   // reference member and a const member, so it is not copy-assignable.
   ComputeBondedCUDAKernel(int deviceID, CudaNonbondedTables& cudaNonbondedTables);
   ~ComputeBondedCUDAKernel();

   // Over-allocation factor (1.4x).
   // NOTE(review): presumably applied when sizing the tuple buffer -- confirm
   // in reallocateTupleBuffer().
   static constexpr float kTupleOveralloc = 1.4f;
   // Rounds n up to the nearest multiple of WARPSIZE using integer division
   // (exact for non-negative n; a multiple of WARPSIZE is returned unchanged).
   static int warpAlign(const int n) {return ((n + WARPSIZE - 1)/WARPSIZE)*WARPSIZE;}

   // Takes the per-type tuple counts together with one packed buffer
   // (h_tupleData) and a stream.
   // NOTE(review): presumably copies the packed tuples into tupleData and
   // recomputes the typed pointers above -- confirm in the implementation.
   void update(
     const int numBondsIn,
     const int numAnglesIn,
     const int numDihedralsIn,
     const int numImpropersIn,
     const int numModifiedExclusionsIn,
     const int numExclusionsIn,
     const int numCrosstermsIn,
     const char* h_tupleData,
     cudaStream_t stream);

   // Tuple-count and buffer management. Definitions are not in this header;
   // the meaning of the size_t returned by reallocateTupleBuffer() should be
   // checked against the implementation.
   void setTupleCounts(
     const TupleCounts count);
   size_t reallocateTupleBuffer(
     const TupleCounts countIn,
     cudaStream_t stream);
   void updateAtomBuffer(
     const int atomStorageSize,
     cudaStream_t stream);

   TupleCounts getTupleCounts();
   TupleData getData();

   // One setup call per parameter table: an entry count plus a pointer to the
   // source values (h_ prefix: presumably host memory -- confirm).
   void setupBondValues(int numBondValues, CudaBondValue* h_bondValues);
   void setupAngleValues(int numAngleValues, CudaAngleValue* h_angleValues);
   void setupDihedralValues(int numDihedralValues, CudaDihedralValue* h_dihedralValues);
   void setupImproperValues(int numImproperValues, CudaDihedralValue* h_improperValues);
   void setupCrosstermValues(int numCrosstermValues, CudaCrosstermValue* h_crosstermValues);

   // Size helpers derived from atomStorageSize; the formulas are defined out
   // of line. Note that they return int, not size_t.
   int getForceStride(const int atomStorageSize);
   int getForceSize(const int atomStorageSize);
   int getAllForceSize(const int atomStorageSize, const bool doSlow);
   // Returns the raw coordinate buffer pointer (commented above as device memory).
   float4* getAtomBuffer(){ return xyzq;}

   // Main force-evaluation entry point, issued on `stream`.
   // The do* flags select optional outputs/paths (energy, virial, slow forces,
   // table lookup); lata/latb/latc are three lattice vectors.
   // NOTE(review): h_xyzq / h_forces / h_energies are presumably host-side
   // buffers, and atomsChanged / CUDASOAintegratorOn / useDeviceMigration
   // presumably control which copies are performed -- confirm in the
   // implementation, which is not part of this header.
   void bondedForce(
     const double scale14, const int atomStorageSize,
     const bool doEnergy, const bool doVirial, const bool doSlow,
     const bool doTable,
     const float3 lata, const float3 latb, const float3 latc,
     const float cutoff2, const float r2_delta, const int r2_delta_expc,
     const CudaNBConstants nbConstants,
     const float4* h_xyzq, double* h_forces,
     double *h_energies, bool atomsChanged,
     bool CUDASOAintegratorOn, bool useDeviceMigration,
     cudaStream_t stream);

   // Alchemical state updates. The flags overload takes no stream argument,
   // unlike the parameter and lambda overloads.
   void updateCudaAlchFlags(const CudaAlchFlags& h_cudaAlchFlags);
   void updateCudaAlchParameters(const CudaAlchParameters* h_cudaAlchParameters, cudaStream_t stream);
   void updateCudaAlchLambdas(const CudaAlchLambdas* h_cudaAlchLambdas, cudaStream_t stream);
 };

 #endif

 #endif // COMPUTEBONDEDCUDAKERNEL_H
ComputeBondedCUDAKernel::amdDiheVirialIndex_ZX
Definition: ComputeBondedCUDAKernel.h:46

CudaBond
Definition: TupleTypesCUDA.h:17

CudaUtils.h

ComputeBondedCUDAKernel::energyIndex_LJ_F
Definition: ComputeBondedCUDAKernel.h:32

ComputeBondedCUDAKernel::normalVirialIndex_YY
Definition: ComputeBondedCUDAKernel.h:36

CudaAlchLambdas
Definition: TupleTypesCUDA.h:167

ComputeBondedCUDAKernel::amdDiheVirialIndex_YZ
Definition: ComputeBondedCUDAKernel.h:45

ComputeBondedCUDAKernel::getAtomBuffer
float4 * getAtomBuffer()
Definition: ComputeBondedCUDAKernel.h:176

ComputeBondedCUDAKernel::normalVirialIndex_XZ
Definition: ComputeBondedCUDAKernel.h:35

ComputeBondedCUDAKernel::~ComputeBondedCUDAKernel
~ComputeBondedCUDAKernel()

ComputeBondedCUDAKernel::amdDiheVirialIndex_ZZ
Definition: ComputeBondedCUDAKernel.h:46

ComputeBondedCUDAKernel::energyIndex_ELECT_SLOW_TI_2
Definition: ComputeBondedCUDAKernel.h:33

ComputeBondedCUDAKernel::warpAlign
static int warpAlign(const int n)
Definition: ComputeBondedCUDAKernel.h:142

ComputeBondedCUDAKernel::slowVirialIndex_ZX
Definition: ComputeBondedCUDAKernel.h:43

ComputeBondedCUDAKernel::BondedVirial::xy
T xy
Definition: ComputeBondedCUDAKernel.h:53

ComputeBondedCUDAKernel::energyIndex_DIHEDRAL_TI_1
Definition: ComputeBondedCUDAKernel.h:29

ComputeBondedCUDAKernel::energyIndex_LJ_TI_1
Definition: ComputeBondedCUDAKernel.h:32

ComputeBondedCUDAKernel::energyIndex_ELECT_SLOW_F
Definition: ComputeBondedCUDAKernel.h:33

ComputeBondedCUDAKernel::getForceStride
int getForceStride(const int atomStorageSize)

ComputeBondedCUDAKernel::nbondVirialIndex_ZY
Definition: ComputeBondedCUDAKernel.h:40

ComputeBondedCUDAKernel::normalVirialIndex_YX
Definition: ComputeBondedCUDAKernel.h:36

ComputeBondedCUDAKernel::updateCudaAlchParameters
void updateCudaAlchParameters(const CudaAlchParameters *h_cudaAlchParameters, cudaStream_t stream)

ComputeBondedCUDAKernel::getAllForceSize
int getAllForceSize(const int atomStorageSize, const bool doSlow)

ComputeBondedCUDAKernel::energyIndex_ELECT_TI_1
Definition: ComputeBondedCUDAKernel.h:31

CudaDihedralValue
Definition: TupleTypesCUDA.h:127

ComputeBondedCUDAKernel::getTupleCounts
TupleCounts getTupleCounts()

ComputeBondedCUDAKernel::slowVirialIndex_XY
Definition: ComputeBondedCUDAKernel.h:41

CudaExclusion
Definition: TupleTypesCUDA.h:76

ComputeBondedCUDAKernel::amdDiheVirialIndex_YY
Definition: ComputeBondedCUDAKernel.h:45

ComputeBondedCUDAKernel::energyIndex_IMPROPER_TI_1
Definition: ComputeBondedCUDAKernel.h:30

ComputeBondedCUDAKernel::amdDiheVirialIndex_XX
Definition: ComputeBondedCUDAKernel.h:44

ComputeBondedCUDAKernel::nbondVirialIndex_ZX
Definition: ComputeBondedCUDAKernel.h:40

ComputeBondedCUDAKernel::energyIndex_DIHEDRAL_TI_2
Definition: ComputeBondedCUDAKernel.h:29

ComputeBondedCUDAKernel::nbondVirialIndex_YZ
Definition: ComputeBondedCUDAKernel.h:39

WARPSIZE
#define WARPSIZE
Definition: CudaUtils.h:17

ComputeBondedCUDAKernel::BondedVirial::yy
T yy
Definition: ComputeBondedCUDAKernel.h:56

ComputeBondedCUDAKernel::slowVirialIndex_YY
Definition: ComputeBondedCUDAKernel.h:42

ComputeBondedCUDAKernel::setupAngleValues
void setupAngleValues(int numAngleValues, CudaAngleValue *h_angleValues)

ComputeBondedCUDAKernel::energyIndex_CROSSTERM_F
Definition: ComputeBondedCUDAKernel.h:34

TupleCounts
Definition: TupleTypesCUDA.h:186

ComputeBondedCUDAKernel::energyIndex_LJ_TI_2
Definition: ComputeBondedCUDAKernel.h:32

ComputeBondedCUDAKernel::energyIndex_BOND
Definition: ComputeBondedCUDAKernel.h:25

ComputeBondedCUDAKernel::energyIndex_BOND_TI_1
Definition: ComputeBondedCUDAKernel.h:27

ComputeBondedCUDAKernel::slowVirialIndex_XZ
Definition: ComputeBondedCUDAKernel.h:41

ComputeBondedCUDAKernel::energyIndex_IMPROPER_F
Definition: ComputeBondedCUDAKernel.h:30

ComputeBondedCUDAKernel::energyIndex_ELECT_F
Definition: ComputeBondedCUDAKernel.h:31

TupleTypesCUDA.h

ComputeBondedCUDAKernel::normalVirialIndex_ZZ
Definition: ComputeBondedCUDAKernel.h:37

CudaNBConstants
Definition: CudaUtils.h:593

CudaBondValue
Definition: TupleTypesCUDA.h:113

ComputeBondedCUDAKernel::setupBondValues
void setupBondValues(int numBondValues, CudaBondValue *h_bondValues)

ComputeBondedCUDAKernel::getForceSize
int getForceSize(const int atomStorageSize)

ComputeBondedCUDAKernel::slowVirialIndex_YX
Definition: ComputeBondedCUDAKernel.h:42

ComputeBondedCUDAKernel::BondedVirial::zx
T zx
Definition: ComputeBondedCUDAKernel.h:58

ComputeBondedCUDAKernel::normalVirialIndex_ZX
Definition: ComputeBondedCUDAKernel.h:37

ComputeBondedCUDAKernel::energyIndex_ANGLE_TI_1
Definition: ComputeBondedCUDAKernel.h:28

ComputeBondedCUDAKernel::setupImproperValues
void setupImproperValues(int numImproperValues, CudaDihedralValue *h_improperValues)

ComputeBondedCUDAKernel::BondedVirial::yx
T yx
Definition: ComputeBondedCUDAKernel.h:55

ComputeBondedCUDAKernel::slowVirialIndex_YZ
Definition: ComputeBondedCUDAKernel.h:42

ComputeBondedCUDAKernel::energyIndex_BOND_TI_2
Definition: ComputeBondedCUDAKernel.h:27

CudaAngle
Definition: TupleTypesCUDA.h:37

ComputeBondedCUDAKernel::energies_virials_SIZE
Definition: ComputeBondedCUDAKernel.h:47

ComputeBondedCUDAKernel::energyIndex_CROSSTERM
Definition: ComputeBondedCUDAKernel.h:26

TupleData
Definition: TupleTypesCUDA.h:239

ComputeBondedCUDAKernel::setupCrosstermValues
void setupCrosstermValues(int numCrosstermValues, CudaCrosstermValue *h_crosstermValues)

CudaAlchParameters
Definition: TupleTypesCUDA.h:159

ComputeBondedCUDAKernel::energyIndex_ELECT_TI_2
Definition: ComputeBondedCUDAKernel.h:31

ComputeBondedCUDAKernel::energyIndex_ANGLE
Definition: ComputeBondedCUDAKernel.h:25

CudaNonbondedTables
Definition: CudaNonbondedTables.h:16

ComputeBondedCUDAKernel::nbondVirialIndex_XZ
Definition: ComputeBondedCUDAKernel.h:38

ComputeBondedCUDAKernel::BondedVirial::zy
T zy
Definition: ComputeBondedCUDAKernel.h:59

ComputeBondedCUDAKernel::getData
TupleData getData()

ComputeBondedCUDAKernel::energyIndex_CROSSTERM_TI_1
Definition: ComputeBondedCUDAKernel.h:34

ComputeBondedCUDAKernel::slowVirialIndex_XX
Definition: ComputeBondedCUDAKernel.h:41

ComputeBondedCUDAKernel::BondedVirial::xx
T xx
Definition: ComputeBondedCUDAKernel.h:52

FORCE_TYPE
#define FORCE_TYPE
Definition: ComputeBondedCUDAKernel.h:9

ComputeBondedCUDAKernel::energyIndex_ELECT_SLOW_TI_1
Definition: ComputeBondedCUDAKernel.h:33

CudaCrossterm
Definition: TupleTypesCUDA.h:92

ComputeBondedCUDAKernel::amdDiheVirialIndex_XY
Definition: ComputeBondedCUDAKernel.h:44

ComputeBondedCUDAKernel::bondedForce
void bondedForce(const double scale14, const int atomStorageSize, const bool doEnergy, const bool doVirial, const bool doSlow, const bool doTable, const float3 lata, const float3 latb, const float3 latc, const float cutoff2, const float r2_delta, const int r2_delta_expc, const CudaNBConstants nbConstants, const float4 *h_xyzq, double *h_forces, double *h_energies, bool atomsChanged, bool CUDASOAintegratorOn, bool useDeviceMigration, cudaStream_t stream)

ComputeBondedCUDAKernel::normalVirialIndex_YZ
Definition: ComputeBondedCUDAKernel.h:36

ComputeBondedCUDAKernel::BondedVirial::xz
T xz
Definition: ComputeBondedCUDAKernel.h:54

ComputeBondedCUDAKernel::nbondVirialIndex_XY
Definition: ComputeBondedCUDAKernel.h:38

ComputeBondedCUDAKernel::nbondVirialIndex_YX
Definition: ComputeBondedCUDAKernel.h:39

ComputeBondedCUDAKernel::normalVirialIndex_XX
Definition: ComputeBondedCUDAKernel.h:35

CudaCrosstermValue
Definition: TupleTypesCUDA.h:135

ComputeBondedCUDAKernel::energyIndex_IMPROPER_TI_2
Definition: ComputeBondedCUDAKernel.h:30

ComputeBondedCUDAKernel::updateCudaAlchFlags
void updateCudaAlchFlags(const CudaAlchFlags &h_cudaAlchFlags)

ComputeBondedCUDAKernel::ComputeBondedCUDAKernel
ComputeBondedCUDAKernel(int deviceID, CudaNonbondedTables &cudaNonbondedTables)

ComputeBondedCUDAKernel::nbondVirialIndex_ZZ
Definition: ComputeBondedCUDAKernel.h:40

CudaDihedral
Definition: TupleTypesCUDA.h:56

ComputeBondedCUDAKernel::setupDihedralValues
void setupDihedralValues(int numDihedralValues, CudaDihedralValue *h_dihedralValues)

ComputeBondedCUDAKernel::energyIndex_ANGLE_F
Definition: ComputeBondedCUDAKernel.h:28

ComputeBondedCUDAKernel::energyIndex_ANGLE_TI_2
Definition: ComputeBondedCUDAKernel.h:28

ComputeBondedCUDAKernel::energyIndex_DIHEDRAL
Definition: ComputeBondedCUDAKernel.h:25

ComputeBondedCUDAKernel::updateCudaAlchLambdas
void updateCudaAlchLambdas(const CudaAlchLambdas *h_cudaAlchLambdas, cudaStream_t stream)

ComputeBondedCUDAKernel::BondedVirial
Definition: ComputeBondedCUDAKernel.h:50

ComputeBondedCUDAKernel::amdDiheVirialIndex_XZ
Definition: ComputeBondedCUDAKernel.h:44

ComputeBondedCUDAKernel
Definition: ComputeBondedCUDAKernel.h:21

CudaAngleValue
Definition: TupleTypesCUDA.h:119

ComputeBondedCUDAKernel::energyIndex_DIHEDRAL_F
Definition: ComputeBondedCUDAKernel.h:29

ComputeBondedCUDAKernel::energyIndex_ELECT
Definition: ComputeBondedCUDAKernel.h:26

ComputeBondedCUDAKernel::energyIndex_BOND_F
Definition: ComputeBondedCUDAKernel.h:27

CudaNonbondedTables.h

ComputeBondedCUDAKernel::nbondVirialIndex_XX
Definition: ComputeBondedCUDAKernel.h:38

ComputeBondedCUDAKernel::normalVirialIndex_ZY
Definition: ComputeBondedCUDAKernel.h:37

ComputeBondedCUDAKernel::slowVirialIndex_ZY
Definition: ComputeBondedCUDAKernel.h:43

ComputeBondedCUDAKernel::amdDiheVirialIndex_ZY
Definition: ComputeBondedCUDAKernel.h:46

ComputeBondedCUDAKernel::BondedVirial::yz
T yz
Definition: ComputeBondedCUDAKernel.h:57

ComputeBondedCUDAKernel::setTupleCounts
void setTupleCounts(const TupleCounts count)

ComputeBondedCUDAKernel::kTupleOveralloc
static constexpr float kTupleOveralloc
Definition: ComputeBondedCUDAKernel.h:141

ComputeBondedCUDAKernel::amdDiheVirialIndex_YX
Definition: ComputeBondedCUDAKernel.h:45

ComputeBondedCUDAKernel::nbondVirialIndex_YY
Definition: ComputeBondedCUDAKernel.h:39

ComputeBondedCUDAKernel::energyIndex_CROSSTERM_TI_2
Definition: ComputeBondedCUDAKernel.h:34

ComputeBondedCUDAKernel::reallocateTupleBuffer
size_t reallocateTupleBuffer(const TupleCounts countIn, cudaStream_t stream)

ComputeBondedCUDAKernel::getForces
double * getForces()
Definition: ComputeBondedCUDAKernel.h:69

ComputeBondedCUDAKernel::BondedVirial::zz
T zz
Definition: ComputeBondedCUDAKernel.h:60

ComputeBondedCUDAKernel::slowVirialIndex_ZZ
Definition: ComputeBondedCUDAKernel.h:43

ComputeBondedCUDAKernel::energyIndex_IMPROPER
Definition: ComputeBondedCUDAKernel.h:25

ComputeBondedCUDAKernel::energyIndex_LJ
Definition: ComputeBondedCUDAKernel.h:26

CudaAlchFlags
Definition: TupleTypesCUDA.h:141

ComputeBondedCUDAKernel::updateAtomBuffer
void updateAtomBuffer(const int atomStorageSize, cudaStream_t stream)

ComputeBondedCUDAKernel::normalVirialIndex_XY
Definition: ComputeBondedCUDAKernel.h:35

ComputeBondedCUDAKernel::energyIndex_ELECT_SLOW
Definition: ComputeBondedCUDAKernel.h:26

ComputeBondedCUDAKernel::update
void update(const int numBondsIn, const int numAnglesIn, const int numDihedralsIn, const int numImpropersIn, const int numModifiedExclusionsIn, const int numExclusionsIn, const int numCrosstermsIn, const char *h_tupleData, cudaStream_t stream)