|
|
static int | deviceParallelExecutionSize (const DeviceInformation &deviceInfo) |
| |
|
template<int order, bool computeSplines, bool spreadCharges, bool wrapX, bool wrapY, int mode, bool writeGlobal, ThreadsPerAtom threadsPerAtom, int parallelExecutionWidth> |
| __global__ void | pmeSplineAndSpreadKernel (PmeGpuKernelParams kernelParams) |
| | Forward declarations of the PME HIP kernels. The kernels themselves are documented in their respective files.
|
| |
|
template<GridOrdering gridOrdering, bool computeEnergyAndVirial, const int gridIndex, int parallelExecutionWidth> |
| __global__ void | pmeSolveKernel (PmeGpuKernelParams kernelParams) |
| |
|
template<int order, bool wrapX, bool wrapY, int nGrids, bool readGlobal, ThreadsPerAtom threadsPerAtom, int parallelExecutionWidth> |
| __global__ void | pmeGatherKernel (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, true, true, true, 1, true, ThreadsPerAtom::Order, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, false, true, true, 1, true, ThreadsPerAtom::Order, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, false, true, true, true, 1, true, ThreadsPerAtom::Order, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, true, true, true, 1, false, ThreadsPerAtom::Order, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, true, true, true, 1, true, ThreadsPerAtom::OrderSquared, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, false, true, true, 1, true, ThreadsPerAtom::OrderSquared, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, false, true, true, true, 1, true, ThreadsPerAtom::OrderSquared, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, true, true, true, 1, false, ThreadsPerAtom::OrderSquared, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, true, true, true, 2, true, ThreadsPerAtom::Order, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, false, true, true, 2, true, ThreadsPerAtom::Order, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, false, true, true, true, 2, true, ThreadsPerAtom::Order, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, true, true, true, 2, false, ThreadsPerAtom::Order, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, true, true, true, 2, true, ThreadsPerAtom::OrderSquared, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, false, true, true, 2, true, ThreadsPerAtom::OrderSquared, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, false, true, true, true, 2, true, ThreadsPerAtom::OrderSquared, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, true, true, true, 2, false, ThreadsPerAtom::OrderSquared, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeGatherKernel< 4, true, true, 1, true, ThreadsPerAtom::Order, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeGatherKernel< 4, true, true, 1, false, ThreadsPerAtom::Order, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeGatherKernel< 4, true, true, 1, true, ThreadsPerAtom::OrderSquared, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeGatherKernel< 4, true, true, 1, false, ThreadsPerAtom::OrderSquared, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeGatherKernel< 4, true, true, 2, true, ThreadsPerAtom::Order, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeGatherKernel< 4, true, true, 2, false, ThreadsPerAtom::Order, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeGatherKernel< 4, true, true, 2, true, ThreadsPerAtom::OrderSquared, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeGatherKernel< 4, true, true, 2, false, ThreadsPerAtom::OrderSquared, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSolveKernel< GridOrdering::XYZ, false, c_stateA, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSolveKernel< GridOrdering::XYZ, true, c_stateA, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSolveKernel< GridOrdering::YZX, false, c_stateA, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSolveKernel< GridOrdering::YZX, true, c_stateA, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSolveKernel< GridOrdering::XYZ, false, c_stateB, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSolveKernel< GridOrdering::XYZ, true, c_stateB, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSolveKernel< GridOrdering::YZX, false, c_stateB, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSolveKernel< GridOrdering::YZX, true, c_stateB, 32 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, true, true, true, 1, true, ThreadsPerAtom::Order, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, false, true, true, 1, true, ThreadsPerAtom::Order, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, false, true, true, true, 1, true, ThreadsPerAtom::Order, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, true, true, true, 1, false, ThreadsPerAtom::Order, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, true, true, true, 1, true, ThreadsPerAtom::OrderSquared, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, false, true, true, 1, true, ThreadsPerAtom::OrderSquared, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, false, true, true, true, 1, true, ThreadsPerAtom::OrderSquared, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, true, true, true, 1, false, ThreadsPerAtom::OrderSquared, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, true, true, true, 2, true, ThreadsPerAtom::Order, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, false, true, true, 2, true, ThreadsPerAtom::Order, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, false, true, true, true, 2, true, ThreadsPerAtom::Order, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, true, true, true, 2, false, ThreadsPerAtom::Order, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, true, true, true, 2, true, ThreadsPerAtom::OrderSquared, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, false, true, true, 2, true, ThreadsPerAtom::OrderSquared, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, false, true, true, true, 2, true, ThreadsPerAtom::OrderSquared, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSplineAndSpreadKernel< 4, true, true, true, true, 2, false, ThreadsPerAtom::OrderSquared, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeGatherKernel< 4, true, true, 1, true, ThreadsPerAtom::Order, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeGatherKernel< 4, true, true, 1, false, ThreadsPerAtom::Order, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeGatherKernel< 4, true, true, 1, true, ThreadsPerAtom::OrderSquared, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeGatherKernel< 4, true, true, 1, false, ThreadsPerAtom::OrderSquared, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeGatherKernel< 4, true, true, 2, true, ThreadsPerAtom::Order, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeGatherKernel< 4, true, true, 2, false, ThreadsPerAtom::Order, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeGatherKernel< 4, true, true, 2, true, ThreadsPerAtom::OrderSquared, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeGatherKernel< 4, true, true, 2, false, ThreadsPerAtom::OrderSquared, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSolveKernel< GridOrdering::XYZ, false, c_stateA, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSolveKernel< GridOrdering::XYZ, true, c_stateA, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSolveKernel< GridOrdering::YZX, false, c_stateA, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSolveKernel< GridOrdering::YZX, true, c_stateA, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSolveKernel< GridOrdering::XYZ, false, c_stateB, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSolveKernel< GridOrdering::XYZ, true, c_stateB, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSolveKernel< GridOrdering::YZX, false, c_stateB, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template __global__ void | pmeSolveKernel< GridOrdering::YZX, true, c_stateB, 64 > (PmeGpuKernelParams kernelParams) |
| |
|
template<int parallelExecutionWidth> |
| static void | setKernelPointersAndParams (struct PmeGpuProgramImpl *pmeGpuProgram) |
| | Helper function that sets the proper kernel functor pointers.
|
| |