CVS diff ComputeNonbondedCUDA.C

Difference for src/ComputeNonbondedCUDA.C from version 1.100 to 1.101

version 1.100

version 1.101

Line 798

// Zero array sizes and pointers

init_arrays();

atoms_size = 0;

atoms = NULL;

forces_size = 0;

forces = NULL;

Line 816

Line 819

if ( master->slavePes[slaveIndex] != CkMyPe() ) {

NAMD_bug("ComputeNonbondedCUDA slavePes[slaveIndex] != CkMyPe");

}

deviceID = master->deviceID;

registerPatches();

return;

}

Line 848

Line 852

cuda_errcheck("in cudaDeviceGetStreamPriorityRange");

if ( leastPriority != greatestPriority ) {

if ( CkMyNode() == 0 ) {

int dev;

int dev = deviceCUDA->getDeviceID();

cudaGetDevice(&dev);

cuda_errcheck("cudaGetDevice");

CkPrintf("CUDA device %d stream priority range %d %d\n", dev, leastPriority, greatestPriority);

}

if ( deviceCUDA->getMergeGrids() && params->PMEOn && params->PMEOffload ) {

if ( deviceCUDA->getMergeGrids() && params->PMEOn && params->PMEOffload && !params->usePMECUDA) {

greatestPriority = leastPriority;

}

if (params->usePMECUDA) greatestPriority = leastPriority;

cudaStreamCreateWithPriority(&stream,cudaStreamDefault,greatestPriority);

cudaStreamCreateWithPriority(&stream2,cudaStreamDefault,leastPriority);

} else

Line 863

Line 866

{

cudaStreamCreate(&stream);

cuda_errcheck("cudaStreamCreate");

int dev;

int dev = deviceCUDA->getDeviceID();

cudaGetDevice(&dev);

cuda_errcheck("cudaGetDevice");

cudaDeviceProp deviceProp;

cudaGetDeviceProperties(&deviceProp, dev);

cuda_errcheck("cudaGetDeviceProperties");

Line 878

Line 879

}

cuda_errcheck("cudaStreamCreate");

// Get GPU device ID

deviceID = deviceCUDA->getDeviceID();

cuda_init();

if ( max_grid_size < 65535 ) NAMD_bug("bad CUDA max_grid_size");

build_exclusions();

Line 890

Line 894

patch_pairs_ptr = new ResizeArray<patch_pair>;

patch_pair_num_ptr = new ResizeArray<int>;

if ( params->PMEOn && params->PMEOffload ) deviceCUDA->setGpuIsMine(0);

if ( params->PMEOn && params->PMEOffload && !params->usePMECUDA) deviceCUDA->setGpuIsMine(0);

}

Line 1152

Line 1156

static __thread int vdw_types_size;

static __thread int* vdw_types;

static __thread int atoms_size;

static __thread atom* atoms;

static __thread int dummy_size;

static __thread float* dummy_dev;

Line 1218

Line 1219

vdw_types_size = 0;

vdw_types = NULL;

atoms_size = 0;

atoms = NULL;

dummy_size = 0;

dummy_dev = NULL;

Line 1433

Line 1431

}

int ComputeNonbondedCUDA::noWork() {

//fprintf(stderr, "ComputeNonbondedCUDA::noWork() %d\n",CkMyPe());

SimParameters *simParams = Node::Object()->simParameters;

Flags &flags = master->patchRecords[hostedPatches[0]].p->flags;

Line 1501

Line 1498

GBISP("C.N.CUDA[%d]::doWork: seq %d, phase %d, workStarted %d, atomsChanged %d\n", \

CkMyPe(), sequence(), gbisPhase, workStarted, atomsChanged);

// Set GPU device ID

cudaCheck(cudaSetDevice(deviceID));

ResizeArray<patch_pair> &patch_pairs(*patch_pairs_ptr);

ResizeArray<int> &patch_pair_num(*patch_pair_num_ptr);

Line 1698

num_remote_atoms = num_atoms - num_local_atoms;

reallocate_host<atom_param>(&atom_params, &atom_params_size, num_atoms, 1.2f);

reallocate_host<int>(&vdw_types, &vdw_types_size, num_atoms, 1.2f);

reallocate_host<atom>(&atoms, &atoms_size, num_atoms, 1.2f);

reallocate_host<CudaAtom>(&atoms, &atoms_size, num_atoms, 1.2f);

reallocate_host<float4>(&forces, &forces_size, num_atoms, 1.2f, cudaHostAllocMapped);

reallocate_host<float4>(&slow_forces, &slow_forces_size, num_atoms, 1.2f, cudaHostAllocMapped);

if (simParams->GBISOn) {

Line 1779

{

#if 1

const CudaAtom *ac = pr.p->getCudaAtomList();

atom *ap = atoms + start;

CudaAtom *ap = atoms + start;

memcpy(ap, ac, sizeof(atom)*n);

#else

Vector center =

Line 1796

}

//GBISP("finished active patches\n")

//CkPrintf("maxMovement = %f maxTolerance = %f save = %d use = %d\n",

// maxAtomMovement, maxPatchTolerance,

// flags.savePairlists, flags.usePairlists);

savePairlists = 0;

usePairlists = 0;

if ( flags.savePairlists ) {

Line 1978

Line 1972

latc.z = lattice.c().z;

SimParameters *simParams = Node::Object()->simParameters;

// Set GPU device ID

cudaSetDevice(deviceID);

const bool streaming = ! (deviceCUDA->getNoStreaming() || simParams->GBISOn);

double walltime;

Line 2009

Line 2006

}

atomsChanged = 0;

cuda_bind_atoms(atoms);

cuda_bind_atoms((const atom *)atoms);

cuda_bind_forces(forces, slow_forces);

cuda_bind_virials(virials, force_ready_queue, block_order);

if ( simParams->GBISOn) {

Line 2171

Line 2168

}

} // phases

} // GBISOn

if ( simParams->PMEOn && simParams->PMEOffload ) break;

if ( simParams->PMEOn && simParams->PMEOffload && !simParams->usePMECUDA) break;

default:

GBISP("C.N.CUDA[%d]::recvYieldDevice: case default\n", CkMyPe())

Legend:

Removed in v.1.100
changed lines
	Added in v.1.101

Made by using version 1.53 of cvs2html