namd/doxygen/CudaGlobalMasterClient_8C_source.html

 #include "CudaGlobalMasterClient.h"
 #include "CudaGlobalMasterClientKernel.h"
 #include "CudaGlobalMasterServer.h"
 #include "CudaUtils.h"
 #include "InfoStream.h"
 #include "ReductionMgr.h"
 #include "Node.h"
 #include "NamdState.h"
 #include "DataExchanger.h"

 #if defined(NAMD_CUDA) && defined(NODEGROUP_FORCE_REGISTER)

 void CudaGlobalMasterClient::initialize(
   const std::vector<std::string>& arguments, int deviceID, cudaStream_t stream) {
   m_name = arguments[1];
   m_device_id = deviceID;
   const std::string msg = "Creating CudaGlobalMasterClient " + m_name +
                           " on PE " + std::to_string(CkMyPe()) + "\n";
   iout << iINFO << msg << endi;
   int savedDevice;
   cudaCheck(cudaGetDevice(&savedDevice));
   cudaCheck(cudaSetDevice(m_device_id));
   allocate_device(&m_d_ExtVirial, 1);
   allocate_device(&m_d_ExtForce, 1);
   cudaCheck(cudaSetDevice(savedDevice));
 }

 // Release the external-virial and external-force device buffers, skipping
 // any pointer that is null.
 CudaGlobalMasterClient::~CudaGlobalMasterClient() {
   if (m_d_ExtVirial != nullptr) {
     deallocate_device(&m_d_ExtVirial);
   }
   if (m_d_ExtForce != nullptr) {
     deallocate_device(&m_d_ExtForce);
   }
 }

 void CudaGlobalMasterClient::unsubscribe() {
   auto master = m_master.lock();
   if (master) {
     master->removeClient(shared_from_this());
     master.reset();
   } else {
     iout << iWARN << "Trying to remove client \"" << name()
          << "\" which is not in the master";
   }
 }

 void CudaGlobalMasterClient::subscribe(
     std::shared_ptr<CudaGlobalMasterServer> master) {
   auto tmp = m_master.lock();
   if (tmp) {
     return;
   } else {
     m_master = master;
     master->addClient(shared_from_this());
   }
 }

 // Log every argument passed to the client and return the literal string
 // "undefined".
 //
 // arguments  the command arguments to report, printed one per line with
 //            their index
 std::string CudaGlobalMasterClient::updateFromTCLCommand(const std::vector<std::string>& arguments) {
   iout << iINFO << "Updating client " << name() << " with arguments:\n" << endi;
   size_t position = 0;
   for (const std::string& argument : arguments) {
     iout << iINFO << "  arguments[" << position << "]: " << argument << '\n' << endi;
     ++position;
   }
   return std::string("undefined");
 }

 void CudaGlobalMasterClient::finishReductions(bool doEnergy, bool doVirial,
                                               NodeReduction *reduction) {
   if (doEnergy && hasEnergy()) {
 #ifdef NODEGROUP_FORCE_REGISTER
     reduction->item(REDUCTION_MISC_ENERGY) += getEnergy();
 #endif
   }
   if (useDefaultExtForceAndVirial()) {
     if (getRequestedAtoms().size() == getRequestedForcedAtoms().size()) {
       if (doVirial) {
         int savedDevice;
         cudaCheck(cudaGetDevice(&savedDevice));
         cudaCheck(cudaSetDevice(m_device_id));
         cudaCheck(cudaMemsetAsync(m_d_ExtVirial, 0, sizeof(cudaTensor), getStream()));
         cudaCheck(cudaMemsetAsync(m_d_ExtForce, 0, sizeof(Vector), getStream()));
         clientVirialAndExtForce(this->getPositions(), this->getAppliedForces(),
                                 this->getRequestedAtoms().size(), m_d_ExtVirial,
                                 m_d_ExtForce, getStream());
         cudaTensor h_virial;
         Vector extForce;
         copy_DtoH(m_d_ExtVirial, &h_virial, 1, getStream());
         copy_DtoH(m_d_ExtForce, &extForce, 1, getStream());
         cudaCheck(cudaStreamSynchronize(getStream()));
 #ifdef NODEGROUP_FORCE_REGISTER
         ADD_TENSOR_OBJECT(reduction, REDUCTION_VIRIAL_NORMAL, h_virial);
         ADD_VECTOR_OBJECT(reduction, REDUCTION_EXT_FORCE_NORMAL, extForce);
 #endif
         cudaCheck(cudaSetDevice(savedDevice));
       }
     } else {
       if (doVirial) {
         iout << iWARN << "Virial is not available for CudaGlobalMasterClient \""
             << name() << "\" since the number of atoms requested ("
             << std::to_string(getRequestedAtoms().size())
             << ") does not match the number of applied forces ("
             << std::to_string(getRequestedForcedAtoms().size()) << ")\n";
       }
     }
   } else {
 #ifdef NODEGROUP_FORCE_REGISTER
     if (hasVirial()) {
       ADD_TENSOR_OBJECT(reduction, REDUCTION_VIRIAL_NORMAL, getVirial());
     }
     if (hasEnergy()) {
       ADD_VECTOR_OBJECT(reduction, REDUCTION_EXT_FORCE_NORMAL, getExtForce());
     }
 #endif
   }
 }

 // Returns the simParameters pointer of the object given by Node::Object().
 SimParameters* CudaGlobalMasterClient::getSimParameters() const {
   Node* const node = Node::Object();
   return node->simParameters;
 }

 // Returns the molecule pointer of the object given by Node::Object().
 Molecule* CudaGlobalMasterClient::getMolecule() const {
   Node* const node = Node::Object();
   return node->molecule;
 }

 // Returns the address of the Controller exposed by the NamdState held in
 // the object given by Node::Object().
 const Controller* CudaGlobalMasterClient::getController() const {
   const Controller& controller = Node::Object()->state->getController();
   return &controller;
 }

 // Reports whether replica support is available: true when CMK_HAS_PARTITION
 // evaluates to non-zero at compile time, false otherwise.
 bool CudaGlobalMasterClient::replica_enabled() const {
 #if CMK_HAS_PARTITION
   const bool partitioned = true;
 #else
   const bool partitioned = false;
 #endif
   return partitioned;
 }

 // Returns the value of CmiMyPartition() as this replica's index.
 int CudaGlobalMasterClient::replica_index() const {
   const int partition = CmiMyPartition();
   return partition;
 }

 // Returns the value of CmiNumPartitions() as the number of replicas.
 int CudaGlobalMasterClient::num_replicas() const {
   const int partitionCount = CmiNumPartitions();
   return partitionCount;
 }

 // Thin wrapper that forwards to replica_barrier().
 void replica_comm_barrier()
 {
   replica_barrier();
 }

 // Receive one message from replica `src_rep` and copy its payload into
 // `msg_data`.
 //
 // msg_data  destination buffer
 // buf_len   capacity of `msg_data` in bytes
 // src_rep   replica (partition) to receive from
 //
 // Returns the number of bytes copied, or 0 when nothing was copied: no
 // message was obtained, the destination is null, the reported size is
 // negative, or the payload does not fit in `buf_len`.
 int replica_comm_recv(char* msg_data, int buf_len, int src_rep) {
   DataMessage *recvMsg = NULL;
   replica_recv(&recvMsg, src_rep, CkMyPe());
   CmiAssert(recvMsg != NULL);
   // Runtime check in addition to the assertion, so a null message is never
   // dereferenced should the assertion be inactive in this build.
   if (recvMsg == NULL) {
     return 0;
   }
   const int msg_size = recvMsg->size;
   int retval = 0;
   // Copy only a payload with a sane size that fits the caller's buffer.
   if (msg_data != NULL && msg_size >= 0 && buf_len >= msg_size) {
     memcpy(msg_data, recvMsg->data, msg_size);
     retval = msg_size;
   }
   // The message is released whether or not its payload was copied.
   CmiFree(recvMsg);
   return retval;
 }

 // Send `msg_len` bytes from `msg_data` to replica `dest_rep` through
 // replica_send(), passing the value of CkMyPe() as the destination PE.
 // Returns `msg_len` unchanged.
 int replica_comm_send(char* msg_data, int msg_len, int dest_rep) {
   const int pe = CkMyPe();
   replica_send(msg_data, msg_len, dest_rep, pe);
   return msg_len;
 }

 #else

 // Fallback constructor compiled when NAMD_CUDA and NODEGROUP_FORCE_REGISTER
 // are not both defined: the client cannot work in such a build, so
 // construction aborts through NAMD_die. Neither parameter is used.
 CudaGlobalMasterClient::CudaGlobalMasterClient(std::string name, int deviceID) {
   // Name both build requirements, since this branch is taken when either one
   // is missing.
   NAMD_die("CudaGlobalMasterClient requires NAMD to be built with CUDA and "
            "NODEGROUP_FORCE_REGISTER");
 }

 #endif // defined(NAMD_CUDA) && defined(NODEGROUP_FORCE_REGISTER)
Node::Object
static Node * Object()
Definition: Node.h:86

NamdState::getController
const Controller & getController() const
Definition: NamdState.h:51

CudaGlobalMasterClientKernel.h

CudaUtils.h

iINFO
std::ostream & iINFO(std::ostream &s)
Definition: InfoStream.C:81

Controller
Definition: Controller.h:106

SimParameters
Definition: SimParameters.h:102

Vector
Definition: Vector.h:72

ADD_TENSOR_OBJECT
#define ADD_TENSOR_OBJECT(R, RL, D)
Definition: ReductionMgr.h:44

Node::simParameters
SimParameters * simParameters
Definition: Node.h:181

deallocate_device
void deallocate_device(T **pp)
Definition: CudaUtils.h:333

allocate_device
void allocate_device(T **pp, const size_t len)
Definition: CudaUtils.h:311

Node.h

InfoStream.h

replica_send
void replica_send(const char *sndbuf, int sendcount, int destPart, int destPE)
Definition: DataExchanger.C:133

endi
std::ostream & endi(std::ostream &s)
Definition: InfoStream.C:54

NodeReduction
Definition: ReductionMgr.h:364

DataMessage
Definition: DataExchanger.h:18

REDUCTION_MISC_ENERGY
Definition: ReductionMgr.h:106

iWARN
std::ostream & iWARN(std::ostream &s)
Definition: InfoStream.C:82

DataMessage::size
int size
Definition: DataExchanger.h:22

iout
#define iout
Definition: InfoStream.h:51

Molecule
Molecule stores the structural information for the system.
Definition: Molecule.h:175

replica_recv
void replica_recv(DataMessage **precvMsg, int srcPart, int srcPE)
Definition: DataExchanger.C:144

CudaGlobalMasterServer.h

NodeReduction::item
ReductionValue & item(int index)
Definition: ReductionMgr.C:633

DataExchanger.h

Node::state
NamdState * state
Definition: Node.h:184

CudaGlobalMasterClient.h

replica_barrier
void replica_barrier()
Definition: DataExchanger.C:168

ReductionMgr.h

NAMD_die
void NAMD_die(const char *err_msg)
Definition: common.C:147

copy_DtoH
void copy_DtoH(const T *d_array, T *h_array, const size_t array_len, cudaStream_t stream=0)
Definition: CudaUtils.h:427

DataMessage::data
char data[1]
Definition: DataExchanger.h:23

ADD_VECTOR_OBJECT
#define ADD_VECTOR_OBJECT(R, RL, D)
Definition: ReductionMgr.h:28

cudaTensor
Definition: CudaUtils.h:75

cudaCheck
#define cudaCheck(stmt)
Definition: CudaUtils.h:233

NamdState.h

CudaGlobalMasterClient::CudaGlobalMasterClient
CudaGlobalMasterClient(std::string name, int deviceID)
Definition: CudaGlobalMasterClient.C:168

Node::molecule
Molecule * molecule
Definition: Node.h:179