NAMD
CudaComputeNonbondedKernel.hip.h
#ifndef CUDACOMPUTENONBONDEDKERNEL_HIP_H
#define CUDACOMPUTENONBONDEDKERNEL_HIP_H
#include "CudaUtils.h"
#include "CudaRecord.h"
#include "CudaNonbondedTables.h"
#include "HipDefines.h"
#if defined(NAMD_HIP)

//! Alchemical data structure that holds the lambda-relevant parameters for FEP/TI.
struct AlchData {
  float scaling;
  float switchdist2;
  float cutoff2;
  float switchfactor;
  float alchVdwShiftCoeff;
  float alchLambda;
  float lambdaUp;
  float lambdaDown;
  float elecLambdaUp;
  float elecLambdaDown;
  float vdwLambdaUp;
  float vdwLambdaDown;

  float lambda2Up;
  float lambda2Down;
  float elecLambda2Up;
  float elecLambda2Down;
  float vdwLambda2Up;
  float vdwLambda2Down;

  float vdwShiftUp;
  float vdwShift2Up;
  float vdwShiftDown;
  float vdwShift2Down;
  bool alchDecouple;
};

class CudaComputeNonbondedKernel {
private:

  const int deviceID;
  CudaNonbondedTables& cudaNonbondedTables;
  const bool doStreaming;

  // Exclusions
  // JM: nvcc seems to zero-initialize this pointer by default, but clang doesn't;
  // we rely on it being NULL so we can initialize it in setExclusionsByAtom() later.
  int2 *d_exclusionsByAtom = NULL;
  unsigned int* overflowExclusions;
  size_t overflowExclusionsSize;

  int2* exclIndexMaxDiff;
  size_t exclIndexMaxDiffSize;

  // Atom indices
  int* atomIndex;
  size_t atomIndexSize;

  // VdW types
  int* vdwTypes;
  size_t vdwTypesSize;

  unsigned int* patchNumCount;
  size_t patchNumCountSize;

  int* patchReadyQueue;
  size_t patchReadyQueueSize;

  float *force_x, *force_y, *force_z, *force_w;
  size_t forceSize;
  float *forceSlow_x, *forceSlow_y, *forceSlow_z, *forceSlow_w;
  size_t forceSlowSize;

  // Drude/NbThole
  int *isDrude;
  size_t isDrudeSize;
  float* drudeAtomAlpha;
  size_t drudeAtomAlphaSize;
public:
  CudaComputeNonbondedKernel(int deviceID, CudaNonbondedTables& cudaNonbondedTables, bool doStreaming);

  static __device__ __host__ __forceinline__ int
  computeNumTiles(const int numAtoms, const int tilesize = BOUNDINGBOXSIZE) {
    return (numAtoms + tilesize - 1) / tilesize;
  }

  static __device__ __host__ __forceinline__ int
  computeAtomPad(const int numAtoms, const int tilesize = BOUNDINGBOXSIZE) {
    return computeNumTiles(numAtoms, tilesize) * tilesize;
  }
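
  // Illustrative example, assuming BOUNDINGBOXSIZE (defined in CudaUtils.h) is 32:
  // computeNumTiles(100) == (100 + 31) / 32 == 4 tiles, and
  // computeAtomPad(100)  == 4 * 32         == 128 padded atom slots,
  // so per-atom storage always covers a whole number of bounding-box tiles.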

  void updateVdwTypesExcl(const int atomStorageSize, const int* h_vdwTypes,
    const int2* h_exclIndexMaxDiff, const int* h_atomIndex, cudaStream_t stream);

  void updateVdwTypesExclOnGPU(CudaTileListKernel& tlKernel,
    const int numPatches, const int atomStorageSize, const bool alchOn,
    CudaLocalRecord* localRecords,
    const int* d_vdwTypes, const int* d_id, const int* d_sortOrder,
    const int* d_partition, cudaStream_t stream);

  void nonbondedForce(CudaTileListKernel& tlKernel,
    const int atomStorageSize, const bool atomsChanged,
    const bool doMinimize, const bool doPairlist,
    const bool doEnergy, const bool doVirial, const bool doSlow, const bool doAlch,
    const bool doAlchVdwForceSwitching,
    const bool doFEP, const bool doTI,
    const bool doNbThole, const bool doTable,
    const float3 lata, const float3 latb, const float3 latc,
    const float4* h_xyzq, const float cutoff2,
    const CudaNBConstants nbConstants,
    float4* d_forces, float4* d_forcesSlow,
    float4* h_forces, float4* h_forcesSlow, AlchData *srcFlags,
    bool lambdaWindowUpdated, char *part,
    bool CUDASOAintegratorOn, bool useDeviceMigration,
    const float drudeNbtholeCut2,
    cudaStream_t stream);

  void reduceVirialEnergy(CudaTileListKernel& tlKernel,
    const int atomStorageSize, const bool doEnergy, const bool doVirial, const bool doSlow, const bool doGBIS,
    float4* d_forces, float4* d_forcesSlow,
    VirialEnergy* d_virialEnergy, cudaStream_t stream);

  void getVirialEnergy(VirialEnergy* h_virialEnergy, cudaStream_t stream);

  void bindExclusions(int numExclusions, unsigned int* exclusion_bits);

  int* getPatchReadyQueue();

  void reallocate_forceSOA(int atomStorageSize);

  void setExclusionsByAtom(int2* h_data, const int num_atoms);

  void updateDrudeData(const int atomStorageSize, const float* h_drudeAtomAlpha, const int* h_isDrude, cudaStream_t stream);
};

#endif // NAMD_HIP
#endif // CUDACOMPUTENONBONDEDKERNEL_HIP_H
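
A minimal usage sketch for the tile-padding helpers and updateVdwTypesExcl(): the caller rounds its per-atom storage up to a whole number of bounding-box tiles with computeAtomPad() before handing host buffers to the kernel object. The helper uploadAtomData and its arguments are hypothetical, not part of NAMD; the host buffers are assumed to be allocated to the padded size.

#include "CudaComputeNonbondedKernel.hip.h"

// Hypothetical caller: pad the atom count so the device copy in
// updateVdwTypesExcl() covers whole bounding-box tiles.
void uploadAtomData(CudaComputeNonbondedKernel& kernel,
                    const int numAtoms,
                    const int* h_vdwTypes,           // per-atom VdW type indices
                    const int2* h_exclIndexMaxDiff,  // per-atom exclusion index / max-diff pairs
                    const int* h_atomIndex,          // per-atom global indices
                    cudaStream_t stream) {
  // Round the atom count up to a multiple of BOUNDINGBOXSIZE.
  const int atomStorageSize = CudaComputeNonbondedKernel::computeAtomPad(numAtoms);
  kernel.updateVdwTypesExcl(atomStorageSize, h_vdwTypes,
                            h_exclIndexMaxDiff, h_atomIndex, stream);
}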