NAMD
|
#include "HipDefines.h"
Go to the source code of this file.
Classes:
struct TransposeBatch< T >
Functions:
void spread_charge (const float4 *atoms, const int numAtoms, const int nfftx, const int nffty, const int nfftz, const int xsize, const int ysize, const int zsize, const int xdim, const int y00, const int z00, const bool periodicY, const bool periodicZ, float *data, const int order, cudaStream_t stream)
void scalar_sum (const bool orderXYZ, const int nfft1, const int nfft2, const int nfft3, const int size1, const int size2, const int size3, const double kappa, const float recip1x, const float recip1y, const float recip1z, const float recip2x, const float recip2y, const float recip2z, const float recip3x, const float recip3y, const float recip3z, const double volume, const float *prefac1, const float *prefac2, const float *prefac3, const int k2_00, const int k3_00, const bool doEnergyVirial, double *energy, double *virial, float2 *data, cudaStream_t stream)
void gather_force (const float4 *atoms, const int numAtoms, const int nfftx, const int nffty, const int nfftz, const int xsize, const int ysize, const int zsize, const int xdim, const int y00, const int z00, const bool periodicY, const bool periodicZ, const float *data, const int order, float3 *force, const cudaTextureObject_t gridTexObj, cudaStream_t stream)
void transpose_xyz_yzx (const int nx, const int ny, const int nz, const int xsize_in, const int ysize_in, const int ysize_out, const int zsize_out, const float2 *data_in, float2 *data_out, cudaStream_t stream)
void batchTranspose_xyz_yzx (const int numBatches, TransposeBatch< float2 > *batches, const int max_nx, const int ny, const int nz, const int xsize_in, const int ysize_in, cudaStream_t stream)
void transpose_xyz_zxy (const int nx, const int ny, const int nz, const int xsize_in, const int ysize_in, const int zsize_out, const int xsize_out, const float2 *data_in, float2 *data_out, cudaStream_t stream)
void batchTranspose_xyz_zxy (const int numBatches, TransposeBatch< float2 > *batches, const int max_nx, const int ny, const int nz, const int xsize_in, const int ysize_in, cudaStream_t stream)
void batchTranspose_xyz_yzx (
    const int numBatches,
    TransposeBatch< float2 > *batches,
    const int max_nx,
    const int ny,
    const int nz,
    const int xsize_in,
    const int ysize_in,
    cudaStream_t stream
)
Definition at line 1390 of file CudaPmeSolverUtilKernel.cu.
References cudaCheck, TILEDIM, and TILEROWS.
Referenced by CudaPmeTranspose::transposeXYZtoYZX().
void batchTranspose_xyz_zxy (
    const int numBatches,
    TransposeBatch< float2 > *batches,
    const int max_nx,
    const int ny,
    const int nz,
    const int xsize_in,
    const int ysize_in,
    cudaStream_t stream
)
Definition at line 1425 of file CudaPmeSolverUtilKernel.cu.
References cudaCheck, TILEDIM, and TILEROWS.
Referenced by CudaPmeTranspose::transposeXYZtoZXY().
void gather_force (
    const float4 *atoms,
    const int numAtoms,
    const int nfftx,
    const int nffty,
    const int nfftz,
    const int xsize,
    const int ysize,
    const int zsize,
    const int xdim,
    const int y00,
    const int z00,
    const bool periodicY,
    const bool periodicZ,
    const float *data,
    const int order,
    float3 *force,
    const cudaTextureObject_t gridTexObj,
    cudaStream_t stream
)
Definition at line 1225 of file CudaPmeSolverUtilKernel.cu.
References atoms, cudaCheck, and cudaNAMD_bug().
void scalar_sum (
    const bool orderXYZ,
    const int nfft1,
    const int nfft2,
    const int nfft3,
    const int size1,
    const int size2,
    const int size3,
    const double kappa,
    const float recip1x,
    const float recip1y,
    const float recip1z,
    const float recip2x,
    const float recip2y,
    const float recip2z,
    const float recip3x,
    const float recip3y,
    const float recip3z,
    const double volume,
    const float *prefac1,
    const float *prefac2,
    const float *prefac3,
    const int k2_00,
    const int k3_00,
    const bool doEnergyVirial,
    double *energy,
    double *virial,
    float2 *data,
    cudaStream_t stream
)
Definition at line 1158 of file CudaPmeSolverUtilKernel.cu.
References cudaCheck, M_PI, and WARPSIZE.
Referenced by CudaPmeKSpaceCompute::solve().
void spread_charge (
    const float4 *atoms,
    const int numAtoms,
    const int nfftx,
    const int nffty,
    const int nfftz,
    const int xsize,
    const int ysize,
    const int zsize,
    const int xdim,
    const int y00,
    const int z00,
    const bool periodicY,
    const bool periodicZ,
    float *data,
    const int order,
    cudaStream_t stream
)
Definition at line 1072 of file CudaPmeSolverUtilKernel.cu.
References atoms, cudaCheck, cudaNAMD_bug(), if(), and WARPSIZE.
Referenced by CudaPmeRealSpaceCompute::spreadCharge().
void transpose_xyz_yzx (
    const int nx,
    const int ny,
    const int nz,
    const int xsize_in,
    const int ysize_in,
    const int ysize_out,
    const int zsize_out,
    const float2 *data_in,
    float2 *data_out,
    cudaStream_t stream
)
Definition at line 1371 of file CudaPmeSolverUtilKernel.cu.
References cudaCheck, TILEDIM, and TILEROWS.
void transpose_xyz_zxy (
    const int nx,
    const int ny,
    const int nz,
    const int xsize_in,
    const int ysize_in,
    const int zsize_out,
    const int xsize_out,
    const float2 *data_in,
    float2 *data_out,
    cudaStream_t stream
)
Definition at line 1406 of file CudaPmeSolverUtilKernel.cu.
References cudaCheck, TILEDIM, and TILEROWS.