namd/doxygen/CudaGlobalMasterClient_8C_source.html

 #include "CudaGlobalMasterClient.h"
 #include "CudaGlobalMasterClientKernel.h"
 #include "CudaGlobalMasterServer.h"
 #include "CudaUtils.h"
 #include "InfoStream.h"
 #include "Lattice.h"
 #include "Molecule.h"
 #include "ReductionMgr.h"
 #include "Node.h"
 #include "NamdState.h"
 #include "DataExchanger.h"
 #include "SimParameters.h"
 #include "ScriptTcl.h"

 namespace CudaGlobalMaster {

 #if (defined(NAMD_CUDA) || defined(NAMD_HIP)) && defined(NODEGROUP_FORCE_REGISTER)

 void CudaGlobalMasterClient::initialize(
   const std::vector<std::string>& arguments, int deviceID, cudaStream_t stream) {
   m_name = arguments[1];
   m_device_id = deviceID;
   const std::string msg = "Creating CudaGlobalMasterClient " + m_name +
                           " on PE " + std::to_string(CkMyPe()) + "\n";
   iout << iINFO << msg << endi;
   int savedDevice;
   cudaCheck(cudaGetDevice(&savedDevice));
   cudaCheck(cudaSetDevice(m_device_id));
   allocate_device(&m_d_ExtVirial, 1);
   allocate_device(&m_d_ExtForce, 1);
   allocate_host(&m_h_virial, 1);
   allocate_host(&m_h_ExtForce, 1);
   cudaCheck(cudaSetDevice(savedDevice));
 }

 CudaGlobalMasterClient::~CudaGlobalMasterClient() {
   if (m_d_ExtVirial)
     deallocate_device(&m_d_ExtVirial);
   if (m_d_ExtForce)
     deallocate_device(&m_d_ExtForce);
   if (m_h_virial)
     deallocate_host(&m_h_virial);
   if (m_h_ExtForce)
     deallocate_host(&m_h_ExtForce);
 }

 void CudaGlobalMasterClient::unsubscribe() {
   auto master = m_master.lock();
   if (master) {
     master->removeClient(shared_from_this());
     master.reset();
   } else {
     iout << iWARN << "Trying to remove client \"" << name()
          << "\" which is not in the master";
   }
 }

 void CudaGlobalMasterClient::subscribe(
     std::shared_ptr<CudaGlobalMasterServer> master) {
   auto tmp = m_master.lock();
   if (tmp) {
     return;
   } else {
     m_master = master;
     master->addClient(shared_from_this());
   }
 }

 int CudaGlobalMasterClient::updateFromTCLCommand(const std::vector<std::string>& arguments) {
   iout << iINFO << "Updating client " << name() << " with arguments:\n" << endi;
   for (size_t i = 0; i < arguments.size(); ++i) {
     iout << iINFO << "  arguments[" << i << "]: " << arguments[i] << '\n' << endi;
   }
 #ifdef NAMD_TCL
   return TCL_OK;
 #else
   return 0;
 #endif // NAMD_TCL
 }

 std::string CudaGlobalMasterClient::getTCLUpdateResult() {
   return "undefined";
 }

 bool CudaGlobalMasterClient::tclAvailable() const {
 #ifdef NAMD_TCL
   return true;
 #else
   return false;
 #endif // NAMD_TCL
 }

 void CudaGlobalMasterClient::finishReductions(bool doEnergy, bool doVirial,
                                               SubmitReduction *reduction) {
   if (doEnergy && hasEnergy()) {
     reduction->item(REDUCTION_MISC_ENERGY) += getEnergy();
   }
   if (useDefaultExtForceAndVirial()) {
     if (getRequestedAtoms().size() == getRequestedForcedAtoms().size()) {
       if (doVirial) {
         int savedDevice;
         cudaCheck(cudaGetDevice(&savedDevice));
         cudaCheck(cudaSetDevice(m_device_id));
         cudaCheck(cudaMemsetAsync(m_d_ExtVirial, 0, sizeof(cudaTensor), getStream()));
         cudaCheck(cudaMemsetAsync(m_d_ExtForce, 0, sizeof(Vector), getStream()));
         clientVirialAndExtForce(this->getPositions(), this->getAppliedForces(),
                                 this->getRequestedAtoms().size(), m_d_ExtVirial,
                                 m_d_ExtForce, getStream());
         copy_DtoH(m_d_ExtVirial, m_h_virial, 1, getStream());
         copy_DtoH(m_d_ExtForce, m_h_ExtForce, 1, getStream());
         cudaCheck(cudaStreamSynchronize(getStream()));
         ADD_TENSOR_OBJECT(reduction, REDUCTION_VIRIAL_NORMAL, (*m_h_virial));
         ADD_VECTOR_OBJECT(reduction, REDUCTION_EXT_FORCE_NORMAL, (*m_h_ExtForce));
         cudaCheck(cudaSetDevice(savedDevice));
       }
     } else {
       if (doVirial) {
         iout << iWARN << "Virial is not available for CudaGlobalMasterClient \""
             << name() << "\" since the number of atoms requested ("
             << std::to_string(getRequestedAtoms().size())
             << ") does not match the number of applied forces ("
             << std::to_string(getRequestedForcedAtoms().size()) << ")\n";
       }
     }
   } else {
     if (hasVirial()) {
       ADD_TENSOR_OBJECT(reduction, REDUCTION_VIRIAL_NORMAL, getVirial());
     }
     if (hasExtForce()) {
       ADD_VECTOR_OBJECT(reduction, REDUCTION_EXT_FORCE_NORMAL, getExtForce());
     }
   }
 }

 SimParameters* CudaGlobalMasterClient::getSimParameters() const {
   return Node::Object()->simParameters;
 }

 Molecule* CudaGlobalMasterClient::getMolecule() const {

   return Node::Object()->molecule;
 }

 const Controller* CudaGlobalMasterClient::getController() const {
   return &(Node::Object()->state->getController());
 }

 ScriptTcl* CudaGlobalMasterClient::getScript() {
 #ifdef NAMD_TCL
   return Node::Object()->getScript();
 #else
   return nullptr;
 #endif // NAMD_TCL
 }

 bool CudaGlobalMasterClient::replica_enabled() const {
 #if CMK_HAS_PARTITION
   return true;
 #else
   return false;
 #endif
 }

 int CudaGlobalMasterClient::replica_index() const {
   return CmiMyPartition();
 }

 int CudaGlobalMasterClient::num_replicas() const {
   return CmiNumPartitions();
 }

 void replica_comm_barrier() {
   replica_barrier();
 }

 int replica_comm_recv(char* msg_data, int buf_len, int src_rep) {
   DataMessage *recvMsg = NULL;
   replica_recv(&recvMsg, src_rep, CkMyPe());
   CmiAssert(recvMsg != NULL);
   int retval = recvMsg->size;
   if (buf_len >= retval) {
     memcpy(msg_data,recvMsg->data,retval);
   } else {
     retval = 0;
   }
   CmiFree(recvMsg);
   return retval;
 }

 int replica_comm_send(char* msg_data, int msg_len, int dest_rep) {
   replica_send(msg_data, msg_len, dest_rep, CkMyPe());
   return msg_len;
 }

 #else

 CudaGlobalMasterClient::CudaGlobalMasterClient() {
   NAMD_die("CudaGlobalMasterClient requires NAMD to be built with CUDA");
 }

 #endif // (defined(NAMD_CUDA) || defined(NAMD_HIP)) && defined(NODEGROUP_FORCE_REGISTER)
 }
Node::Object
static Node * Object()
Definition: Node.h:86

NamdState::getController
const Controller & getController() const
Definition: NamdState.h:51

CudaGlobalMasterClientKernel.h

CudaUtils.h

iINFO
std::ostream & iINFO(std::ostream &s)
Definition: InfoStream.C:81

Controller
Definition: Controller.h:105

deallocate_host
void deallocate_host(T **pp)
Definition: CudaUtils.h:396

SimParameters
Definition: SimParameters.h:139

Vector
Definition: Vector.h:72

ADD_TENSOR_OBJECT
#define ADD_TENSOR_OBJECT(R, RL, D)
Definition: ReductionMgr.h:44

Node::simParameters
SimParameters * simParameters
Definition: Node.h:181

deallocate_device
void deallocate_device(T **pp)
Definition: CudaUtils.h:342

allocate_device
void allocate_device(T **pp, const size_t len)
Definition: CudaUtils.h:320

Node.h

CudaGlobalMaster
Definition: ComputeMgr.h:56

SubmitReduction::item
BigReal & item(int i)
Definition: ReductionMgr.h:336

InfoStream.h

replica_send
void replica_send(const char *sndbuf, int sendcount, int destPart, int destPE)
Definition: DataExchanger.C:133

endi
std::ostream & endi(std::ostream &s)
Definition: InfoStream.C:54

DataMessage
Definition: DataExchanger.h:18

REDUCTION_MISC_ENERGY
Definition: ReductionMgr.h:107

iWARN
std::ostream & iWARN(std::ostream &s)
Definition: InfoStream.C:82

DataMessage::size
int size
Definition: DataExchanger.h:22

iout
#define iout
Definition: InfoStream.h:51

Molecule
Molecule stores the structural information for the system.
Definition: Molecule.h:174

ScriptTcl
Definition: ScriptTcl.h:22

Molecule.h

replica_recv
void replica_recv(DataMessage **precvMsg, int srcPart, int srcPE)
Definition: DataExchanger.C:144

ScriptTcl.h

SubmitReduction
Definition: ReductionMgr.h:326

CudaGlobalMasterServer.h

DataExchanger.h

Node::state
NamdState * state
Definition: Node.h:184

CudaGlobalMasterClient.h

allocate_host
void allocate_host(T **pp, const size_t len)
Definition: CudaUtils.h:305

replica_barrier
void replica_barrier()
Definition: DataExchanger.C:168

ReductionMgr.h

NAMD_die
void NAMD_die(const char *err_msg)
Definition: common.C:147

SynchronousCollectiveScope::master

copy_DtoH
void copy_DtoH(const T *d_array, T *h_array, const size_t array_len, cudaStream_t stream=0)
Definition: CudaUtils.h:436

DataMessage::data
char data[1]
Definition: DataExchanger.h:23

Node::getScript
ScriptTcl * getScript()
Definition: Node.C:1656

ADD_VECTOR_OBJECT
#define ADD_VECTOR_OBJECT(R, RL, D)
Definition: ReductionMgr.h:28

cudaTensor
Definition: CudaUtils.h:84

cudaCheck
#define cudaCheck(stmt)
Definition: CudaUtils.h:242

NamdState.h

Lattice.h

Node::molecule
Molecule * molecule
Definition: Node.h:179

SimParameters.h