CVS diff DeviceCUDA.h

Difference for src/DeviceCUDA.h from version 1.3 to 1.4

version 1.3

version 1.4

Line 1

#ifndef DEVICECUDA_H

#define DEVICECUDA_H

#ifdef NAMD_CUDA

#include <cuda_runtime.h>

// Event ID that CUDA_TRACE_POLL_REMOTE passes to traceUserEvent().
#define CUDA_EVENT_ID_POLL_REMOTE 98

// Emits a single user trace event tagged with CUDA_EVENT_ID_POLL_REMOTE.
#define CUDA_TRACE_POLL_REMOTE \

traceUserEvent(CUDA_EVENT_ID_POLL_REMOTE)

Line 15

Line 18

do { int dev; cudaGetDevice(&dev); traceUserBracketEvent( \

CUDA_EVENT_ID_BASE + 2 * dev + 1, START, END); } while (0)

// When WIN32 is defined, __thread is redefined as __declspec(thread).
// NOTE(review): presumably so thread-local declarations written with
// __thread also build with the Windows toolchain -- confirm.
#ifdef WIN32

#define __thread __declspec(thread)

#endif

// Class that handles PE <=> CUDA device mapping

Line 34

Line 33

int nomergegrids;

int nostreaming;

// Number of devices on this node

int deviceCount;

// Number of devices on this node that are used for computation

int ndevices;

// List of device IDs that are used for computation

int *devices;

// True when GPU is shared between PEs

bool sharedGpu;

// Index of next PE sharing this GPU

Line 46

Line 54

int *pesSharingDevice;

// TODO(review): meaning undocumented; value is read and written through getGpuIsMine()/setGpuIsMine()

int gpuIsMine;

// Value of __CUDA_ARCH__

int cuda_arch;

// Device ID for this Pe

int deviceID;

// Device properties for all devices on this node

cudaDeviceProp* deviceProps;

void register_user_events();

Line 56

Line 71

void initialize();

// Returns deviceCount, the number of devices on this node.
int getDeviceCount() {
  return deviceCount;
}

// Returns ndevices, the number of devices on this node that are used
// for computation.
int getNumDevice() {
  return ndevices;
}

bool device_shared_with_pe(int pe);

bool one_device_per_node();

Line 72

Line 90

// Returns the current value of the gpuIsMine flag.
int getGpuIsMine() {
  return gpuIsMine;
}

// Stores val into the gpuIsMine flag.
void setGpuIsMine(const int val) {
  gpuIsMine = val;
}

// Returns the stored cuda_arch value.
int get_cuda_arch() {
  return cuda_arch;
}

// Returns deviceID, the device ID for this PE.
int getDeviceID() {
  return deviceID;
}

// Returns the entry at position `rank` in the devices list (the device IDs
// used for computation). `rank` is not range-checked here.
int getDeviceIDbyRank(int rank) {
  return devices[rank];
}

int getDeviceIDforPe(int pe);

int getMasterPeForDeviceID(int deviceID);

int getMaxNumThreads();

int getMaxNumBlocks();

};

#endif //NAMD_CUDA

#endif // DEVICECUDA_H

Legend:

Removed in v.1.3
changed lines
	Added in v.1.4

Made by using version 1.53 of cvs2html