Add basic LJ potential*
- Add PairPotential Abstract class - Add Lennard-Jones potential that should work with both CUDA and C++ code - Add tests on HOST side for LJ potential
This commit is contained in:
parent
f15eb0cf51
commit
5155ec21aa
11 changed files with 114 additions and 154 deletions
|
@ -1,16 +1,14 @@
|
|||
project(${NAME}_cuda_lib CUDA CXX)
|
||||
|
||||
set(HEADER_FILES
|
||||
hello_world.h
|
||||
pair_potentials.cuh
|
||||
)
|
||||
set(SOURCE_FILES
|
||||
hello_world.cu
|
||||
)
|
||||
|
||||
# The library contains header and source files.
|
||||
add_library(${NAME}_cuda_lib STATIC
|
||||
add_library(${NAME}_cuda_lib INTERFACE
|
||||
${SOURCE_FILES}
|
||||
${HEADER_FILES}
|
||||
)
|
||||
|
||||
target_compile_options(${CMAKE_PROJECT_NAME}_cuda_lib PRIVATE -Wno-gnu-line-marker -Wno-pedantic)
|
||||
|
|
|
@ -1,46 +0,0 @@
|
|||
#include <cuda_runtime.h>
|
||||
#include <stdio.h>
|
||||
|
||||
__global__ void hello_cuda() {
|
||||
printf("Hello CUDA from thread %d\n", threadIdx.x);
|
||||
}
|
||||
|
||||
extern "C" void launch_hello_cuda() {
|
||||
// First check device properties
|
||||
cudaDeviceProp prop;
|
||||
cudaGetDeviceProperties(&prop, 1);
|
||||
printf("Using device: %s with compute capability %d.%d\n", prop.name,
|
||||
prop.major, prop.minor);
|
||||
|
||||
hello_cuda<<<1, 10>>>();
|
||||
cudaDeviceSynchronize();
|
||||
fflush(stdout);
|
||||
}
|
||||
|
||||
extern "C" void check_cuda() {
|
||||
int deviceCount = 0;
|
||||
cudaError_t error = cudaGetDeviceCount(&deviceCount);
|
||||
|
||||
if (error != cudaSuccess) {
|
||||
printf("CUDA error: %s\n", cudaGetErrorString(error));
|
||||
}
|
||||
|
||||
printf("Found %d CUDA devices\n", deviceCount);
|
||||
|
||||
for (int i = 0; i < deviceCount; i++) {
|
||||
cudaDeviceProp prop;
|
||||
cudaGetDeviceProperties(&prop, i);
|
||||
|
||||
printf("Device %d: %s\n", i, prop.name);
|
||||
printf(" Compute capability: %d.%d\n", prop.major, prop.minor);
|
||||
printf(" Total global memory: %.2f GB\n",
|
||||
static_cast<float>(prop.totalGlobalMem) / (1024 * 1024 * 1024));
|
||||
printf(" Multiprocessors: %d\n", prop.multiProcessorCount);
|
||||
printf(" Max threads per block: %d\n", prop.maxThreadsPerBlock);
|
||||
printf(" Max threads dimensions: (%d, %d, %d)\n", prop.maxThreadsDim[0],
|
||||
prop.maxThreadsDim[1], prop.maxThreadsDim[2]);
|
||||
printf(" Max grid dimensions: (%d, %d, %d)\n", prop.maxGridSize[0],
|
||||
prop.maxGridSize[1], prop.maxGridSize[2]);
|
||||
printf("\n");
|
||||
}
|
||||
}
|
|
@ -1,10 +0,0 @@
|
|||
#ifndef HELLO_WORLD_CU_H
|
||||
#define HELLO_WORLD_CU_H
|
||||
|
||||
extern "C" {
|
||||
// Declaration of the CUDA function that will be called from C++
|
||||
void launch_hello_cuda();
|
||||
void check_cuda();
|
||||
}
|
||||
|
||||
#endif // HELLO_WORLD_CU_H
|
91
kernels/pair_potentials.cuh
Normal file
91
kernels/pair_potentials.cuh
Normal file
|
@ -0,0 +1,91 @@
|
|||
#ifndef POTENTIALS_H
|
||||
#define POTENTIALS_H
|
||||
|
||||
#include "precision.hpp"
|
||||
#include "vec3.h"
|
||||
|
||||
#ifdef __CUDACC__
|
||||
#define CUDA_CALLABLE __host__ __device__
|
||||
#else
|
||||
#define CUDA_CALLABLE
|
||||
#endif
|
||||
|
||||
/**
|
||||
* Result struct for the Pair Potential
|
||||
*/
|
||||
struct ForceAndEnergy {
|
||||
real energy;
|
||||
Vec3<real> force;
|
||||
|
||||
CUDA_CALLABLE inline static ForceAndEnergy zero() {
|
||||
return {0.0, {0.0, 0.0, 0.0}};
|
||||
};
|
||||
};
|
||||
|
||||
/**
|
||||
* Abstract implementation of a Pair Potential.
|
||||
* Pair potentials are potentials which depend solely on the distance
|
||||
* between two particles. These do not include multi-body potentials such as
|
||||
* EAM
|
||||
*
|
||||
*/
|
||||
struct PairPotential {
|
||||
real m_rcutoffsq;
|
||||
|
||||
PairPotential(real rcutoff) : m_rcutoffsq(rcutoff * rcutoff) {};
|
||||
#ifdef __CUDACC__
|
||||
CUDA_CALLABLE ~PairPotential();
|
||||
#else
|
||||
virtual ~PairPotential() = 0;
|
||||
#endif
|
||||
|
||||
/**
|
||||
* Calculate the force and energy for a specific atom pair based on a
|
||||
* displacement vector r.
|
||||
*/
|
||||
CUDA_CALLABLE virtual ForceAndEnergy calc_force_and_energy(Vec3<real> r) = 0;
|
||||
};
|
||||
|
||||
/**
|
||||
* Calculate the Lennard-Jones energy and force for the current particle pair
|
||||
* described by displacement vector r
|
||||
*/
|
||||
struct LennardJones : PairPotential {
|
||||
real m_epsilon;
|
||||
real m_sigma;
|
||||
|
||||
CUDA_CALLABLE LennardJones(real sigma, real epsilon, real rcutoff)
|
||||
: PairPotential(rcutoff), m_epsilon(epsilon), m_sigma(sigma) {};
|
||||
|
||||
CUDA_CALLABLE ForceAndEnergy calc_force_and_energy(Vec3<real> r) {
|
||||
real rmagsq = r.squared_norm2();
|
||||
if (rmagsq < this->m_rcutoffsq && rmagsq > 0.0) {
|
||||
real inv_rmag = 1 / std::sqrt(rmagsq);
|
||||
|
||||
// Pre-Compute the terms (doing this saves on multiple devisions/pow
|
||||
// function call)
|
||||
real sigma_r = m_sigma * inv_rmag;
|
||||
real sigma_r6 = sigma_r * sigma_r * sigma_r * sigma_r * sigma_r * sigma_r;
|
||||
real sigma_r12 = sigma_r6 * sigma_r6;
|
||||
|
||||
// Get the energy
|
||||
real energy = 4.0 * m_epsilon * (sigma_r12 - sigma_r6);
|
||||
|
||||
// Get the force vector
|
||||
real force_mag =
|
||||
4.0 * m_epsilon *
|
||||
(12.0 * sigma_r12 * inv_rmag - 6.0 * sigma_r6 * inv_rmag);
|
||||
Vec3<real> force = r.scale(force_mag * inv_rmag);
|
||||
|
||||
return {energy, force};
|
||||
|
||||
} else {
|
||||
return ForceAndEnergy::zero();
|
||||
}
|
||||
};
|
||||
|
||||
~LennardJones() {};
|
||||
};
|
||||
|
||||
PairPotential::~PairPotential() {};
|
||||
#endif
|
Loading…
Add table
Add a link
Reference in a new issue