namd/doxygen/ComputeRestraintsCUDA_8C_source.html

 #include "ComputeRestraintsCUDA.h"
 #include "Molecule.h"
 #include "Node.h"
 #include "HomePatch.h"
 #include "SimParameters.h"
 #include "ComputeRestraintsCUDAKernel.h"
 #define MIN_DEBUG_LEVEL 2
 //#define DEBUGM
 #include "Debug.h"

 #ifdef NODEGROUP_FORCE_REGISTER

 // Builds the host and device tables used for position restraints.
 //
 // The constructor
 //   1. caches the restraint options from SimParameters,
 //   2. walks every atom of the Molecule and records, for each constrained
 //      atom, its global ID, force constant and reference position,
 //   3. allocates the host/device buffers sized by the number of constrained
 //      atoms and uploads the per-atom parameters.
 //
 // Parameters:
 //   patchList    - not used by this constructor.
 //   atomMapsList - not used by this constructor (the call that would consume
 //                  it is commented out at the end of the body).
 //   stream       - stored in this->stream and later handed to
 //                  computeRestrainingForce by doForce.
 //   _mGpuOn      - stored in mGpuOn; updateRestrainedAtoms uses it to decide
 //                  whether an atom missing from every AtomMap is a bug.
 ComputeRestraintsCUDA::ComputeRestraintsCUDA(
   std::vector<HomePatch*> &patchList,
   std::vector<AtomMap*> &atomMapsList,
   cudaStream_t stream,
   bool _mGpuOn
 ) {

   mGpuOn = _mGpuOn;
   this->stream = stream;
   Molecule *molecule       = Node::Object()->molecule;
   SimParameters *simParams = Node::Object()->simParameters;
   nConstrainedAtoms = 0;

   // Every option below is forwarded by value to computeRestrainingForce on
   // each doForce call, whether or not its feature flag is on. Give all of
   // them a defined value first so no indeterminate member is ever read.
   consSelectX = false;
   consSelectY = false;
   consSelectZ = false;
   moveVel.x = 0.0;        moveVel.y = 0.0;        moveVel.z = 0.0;
   rotVel = 0.0;
   rotAxis.x = 0.0;        rotAxis.y = 0.0;        rotAxis.z = 0.0;
   rotPivot.x = 0.0;       rotPivot.y = 0.0;       rotPivot.z = 0.0;
   spheConsCenter.x = 0.0; spheConsCenter.y = 0.0; spheConsCenter.z = 0.0;

   // Set the constraints flags
   consExp = simParams->constraintExp;
   // consScaling is intentionally not cached: doForce reads
   // simParams->constraintScaling on every call.

   // Selective constraints flags
   selConsOn = simParams->selectConstraintsOn;
   if (selConsOn) {
     consSelectX = simParams->constrXOn;
     consSelectY = simParams->constrYOn;
     consSelectZ = simParams->constrZOn;
   }

   // Moving constraints flags
   movConsOn = simParams->movingConstraintsOn;
   if (movConsOn) {
     moveVel.x = simParams->movingConsVel.x;
     moveVel.y = simParams->movingConsVel.y;
     moveVel.z = simParams->movingConsVel.z;
   }

   // Rotating constraints flags
   rotConsOn = simParams->rotConstraintsOn;
   if (rotConsOn) {
     rotVel = simParams->rotConsVel; // velocity is a scalar here
     rotAxis.x = simParams->rotConsAxis.x;
     rotAxis.y = simParams->rotConsAxis.y;
     rotAxis.z = simParams->rotConsAxis.z;
     // rotPivot is passed to computeRestrainingForce by doForce but was never
     // assigned anywhere in this file; load it alongside the axis.
     // NOTE(review): assumes SimParameters exposes rotConsPivot as a Vector
     // and that rotPivot has x/y/z members like rotAxis - confirm against the
     // headers.
     rotPivot.x = simParams->rotConsPivot.x;
     rotPivot.y = simParams->rotConsPivot.y;
     rotPivot.z = simParams->rotConsPivot.z;
   }

   // Spherical constraints flags
   spheConsOn = simParams->sphericalConstraintsOn;
   if (spheConsOn) {
     spheConsCenter.x = simParams->sphericalConstrCenter.x;
     spheConsCenter.y = simParams->sphericalConstrCenter.y;
     spheConsCenter.z = simParams->sphericalConstrCenter.z;
   }

   // All flags are set; now gather the per-atom constraint data.
   // Walk the whole molecule and append every constrained atom to the host
   // vectors. constrainedAtomsIndexMap maps a global atom ID to its slot in
   // those vectors.
   const int numAtoms = molecule->numAtoms;
   for (int gid = 0; gid < numAtoms; gid++) {
     if (!molecule->is_atom_constrained(gid)) continue;

     nConstrainedAtoms++;
     constrainedAtomsIndexMap[gid] = h_constrainedID.size();
     h_constrainedID.push_back(gid); // global ID of the constrained atom

     float k;
     Vector refPos;
     molecule->get_cons_params(k, refPos, gid);
     h_k.push_back(k);
     h_cons_x.push_back(refPos.x);
     h_cons_y.push_back(refPos.y);
     h_cons_z.push_back(refPos.z);
   }

   // Host staging buffer plus device buffers, all sized by the number of
   // constrained atoms (d_tbcatomic is a single counter).
   allocate_host<int>(&h_constrainedSOA, nConstrainedAtoms);
   allocate_device<unsigned int>(&d_tbcatomic, 1);
   allocate_device<int>(&d_constrainedSOA, nConstrainedAtoms);
   allocate_device<int>(&d_constrainedID, nConstrainedAtoms);
   allocate_device<double>(&d_k, nConstrainedAtoms);
   allocate_device<double>(&d_cons_x, nConstrainedAtoms);
   allocate_device<double>(&d_cons_y, nConstrainedAtoms);
   allocate_device<double>(&d_cons_z, nConstrainedAtoms);

   // Upload the per-atom parameters gathered above.
   copy_HtoD_sync<double>(h_k.data(), d_k, nConstrainedAtoms);
   copy_HtoD_sync<double>(h_cons_x.data(), d_cons_x, nConstrainedAtoms);
   copy_HtoD_sync<double>(h_cons_y.data(), d_cons_y, nConstrainedAtoms);
   copy_HtoD_sync<double>(h_cons_z.data(), d_cons_z, nConstrainedAtoms);
   copy_HtoD_sync<int>(h_constrainedID.data(), d_constrainedID, nConstrainedAtoms);

   cudaCheck(cudaMemset(d_tbcatomic, 0, sizeof(unsigned int))); // sets the scalar to zero

   // this->updateRestrainedAtoms(atomMapsList, h_globalToLocalID, h_patchOffsets);
 }

 // Rebuilds the mapping from constrained atoms to their positions in the
 // SOA buffers and uploads it to the device.
 //
 // For every constrained global atom ID the function looks the atom up in
 // each AtomMap of atomMapsList. When found, its SOA index is computed as
 // localRecords[h_globalToLocalID[pid]].bufferOffset + index-within-patch and
 // stored in h_constrainedSOA at the atom's slot in the constraint tables;
 // that slot number is also appended to constrainedLocalAtomsIndex.
 //
 // Parameters:
 //   atomMapsList      - maps searched, in order, for each constrained atom.
 //   localRecords      - per-patch records; only bufferOffset is read here.
 //   h_globalToLocalID - indexed by global patch ID, yields the index into
 //                       localRecords.
 //
 // An atom found in no map triggers NAMD_bug unless mGpuOn is set, in which
 // case the atom is skipped.
 void ComputeRestraintsCUDA::updateRestrainedAtoms(
   std::vector<AtomMap*> &atomMapsList,
   std::vector<CudaLocalRecord> &localRecords,
   const int* h_globalToLocalID
 ){
   // JM NOTE: This gets called for every migration step, so it would be good to have this somewhat fast
   // This is serialized, so if we have a lot of constrained atoms, it might become a bottleneck in the future
   DebugM(4, "ComputeRestraintsCUDA::updateRestrainedAtoms "<< nConstrainedAtoms <<"\n"<< endi);
   constrainedLocalAtomsIndex.clear();

   for(int i = 0; i < nConstrainedAtoms; i++){
     // translates the global ID to the SOA ID.
     const int gid = h_constrainedID[i];

     // Start from "not found" so the check below is well defined even when
     // atomMapsList is empty and the search loop never assigns lid.
     LocalID lid;
     lid.pid = -1;
     lid.index = -1;

     // Search for a valid localID in all atom maps
     for(size_t j = 0; j < atomMapsList.size(); j++){
       lid = atomMapsList[j]->localID(gid);
       if (lid.pid != -1) break;
     }

     //JM NOTE: Fields of lid need to be != -1, bc the atom needs to be somewhere
     //          otherwise we have a bug
     // unless mGpuOn, then it is in a patch not on our device
     if (lid.pid == -1) {
       if (!mGpuOn)
         NAMD_bug(" LocalAtomID not found in patchMap");
       continue;
     }

     // JM: Now that we have a patchID and a localPosition inside the patch, I can figure out
     //     the SOA position for each constrained atom
     const int soaPid    = h_globalToLocalID[lid.pid]; // Converts global patch ID to its local position in our SOA data structures
     const int soaIndex  = localRecords[soaPid].bufferOffset + lid.index;
     const int mapoffset = constrainedAtomsIndexMap[gid];
     h_constrainedSOA[mapoffset] = soaIndex;
     constrainedLocalAtomsIndex.push_back(mapoffset);
     DebugM(2, "ComputeRestraintsCUDA::updateRestrainedAtoms gid " << gid <<" mapoffset "<< mapoffset << " constrainedLocalAtomsIndexSize "<<constrainedLocalAtomsIndex.size() <<"\n" << endi);
   }

   // Copy the h_constrainedSOA data structure over to the GPU
   copy_HtoD_sync<int>(h_constrainedSOA, d_constrainedSOA, nConstrainedAtoms);

   // Copy the indices for this device over to the GPU. This overwrites the
   // leading entries of d_constrainedID with slots into the constraint tables.
   int* idxPtr = constrainedLocalAtomsIndex.data();
   copy_HtoD_sync<int>(idxPtr, d_constrainedID, constrainedLocalAtomsIndex.size());

 }

 // doForce is called every time step, so no copies here
 void ComputeRestraintsCUDA::doForce(
   const Lattice *lat,
   const bool doEnergy,
   const bool doVirial,
   const int timeStep,
   double* d_pos_x,
   double* d_pos_y,
   double* d_pos_z,

   double* f_normal_x,
   double* f_normal_y,
   double* f_normal_z,
   double* d_bcEnergy,
   double* h_bcEnergy,
   double3* d_netForce,
   double3* h_netForce,
   cudaTensor* d_virial,
   cudaTensor* h_virial
 ){
   if (constrainedLocalAtomsIndex.empty()) return;
   SimParameters *simParams = Node::Object()->simParameters;

   computeRestrainingForce(
     doEnergy,
     doVirial,
     timeStep,
     constrainedLocalAtomsIndex.size(),
     consExp,
     // consScaling,
     simParams->constraintScaling, // read directly from SimParameters
         // to make sure we always calculate using latest value
     movConsOn,
     rotConsOn,
     selConsOn,
     spheConsOn,
     consSelectX,
     consSelectY,
     consSelectZ,
     rotVel,
     rotAxis,
     rotPivot,
     moveVel,
     spheConsCenter,
     d_constrainedSOA,
     d_constrainedID,
     d_pos_x,
     d_pos_y,
     d_pos_z,
     d_k,
     d_cons_x,
     d_cons_y,
     d_cons_z,
     f_normal_x,
     f_normal_y,
     f_normal_z,
     d_bcEnergy,
     h_bcEnergy,
     d_netForce,
     h_netForce,
     lat,
     d_virial,
     h_virial,
     rotationMatrix,
     d_tbcatomic,
     stream
   );

 }


 // Releases every buffer the constructor allocated: the host staging array
 // h_constrainedSOA and all device arrays.
 ComputeRestraintsCUDA::~ComputeRestraintsCUDA()
 {
   // h_constrainedSOA is obtained with allocate_host in the constructor and
   // was previously never released.
   // NOTE(review): deallocate_host is assumed to be the counterpart helper
   // declared next to allocate_host - confirm.
   deallocate_host<int>(&h_constrainedSOA);

   deallocate_device<unsigned int>(&d_tbcatomic);
   deallocate_device<int>(&d_constrainedSOA);
   deallocate_device<int>(&d_constrainedID);
   deallocate_device<double>(&d_cons_x);
   deallocate_device<double>(&d_cons_y);
   deallocate_device<double>(&d_cons_z);
   deallocate_device<double>(&d_k);
 }

 #endif // NODEGROUP_FORCE_REGISTER
Node::Object
static Node * Object()
Definition: Node.h:86

ComputeRestraintsCUDA.h

Debug.h

HomePatch.h

SimParameters
Definition: SimParameters.h:102

Vector
Definition: Vector.h:72

Node::simParameters
SimParameters * simParameters
Definition: Node.h:181

Node.h

DebugM
#define DebugM(x, y)
Definition: Debug.h:75

endi
std::ostream & endi(std::ostream &s)
Definition: InfoStream.C:54

Vector::z
BigReal z
Definition: Vector.h:74

LocalID
Definition: NamdTypes.h:287

Molecule
Molecule stores the structural information for the system.
Definition: Molecule.h:175

LocalID::index
int32 index
Definition: NamdTypes.h:290

ComputeRestraintsCUDAKernel.h

Molecule.h

NAMD_bug
void NAMD_bug(const char *err_msg)
Definition: common.C:195

Molecule::get_cons_params
void get_cons_params(Real &k, Vector &refPos, int atomnum) const
Definition: Molecule.h:1349

Vector::x
BigReal x
Definition: Vector.h:74

Molecule::numAtoms
int numAtoms
Definition: Molecule.h:585

LocalID::pid
PatchID pid
Definition: NamdTypes.h:289

simParams
#define simParams
Definition: Output.C:129

Vector::y
BigReal y
Definition: Vector.h:74

cudaTensor
Definition: CudaUtils.h:75

cudaCheck
#define cudaCheck(stmt)
Definition: CudaUtils.h:233

Lattice
Definition: Lattice.h:17

Molecule::is_atom_constrained
Bool is_atom_constrained(int atomnum) const
Definition: Molecule.h:1265

Node::molecule
Molecule * molecule
Definition: Node.h:179

SimParameters.h