forked from lijiext/lammps
Kokkos bugfix
git-svn-id: svn://svn.icms.temple.edu/lammps-ro/trunk@14051 f3b2605a-c512-4ea7-a41b-209d697bcdaa
This commit is contained in:
parent
d472396a46
commit
cb971f0166
|
@ -1132,8 +1132,8 @@ KOKKOS_INLINE_FUNCTION
|
||||||
Random_XorShift64<Kokkos::Cuda> Random_XorShift64_Pool<Kokkos::Cuda>::get_state() const {
|
Random_XorShift64<Kokkos::Cuda> Random_XorShift64_Pool<Kokkos::Cuda>::get_state() const {
|
||||||
#ifdef __CUDA_ARCH__
|
#ifdef __CUDA_ARCH__
|
||||||
const int i_offset = (threadIdx.x*blockDim.y + threadIdx.y)*blockDim.z+threadIdx.z;
|
const int i_offset = (threadIdx.x*blockDim.y + threadIdx.y)*blockDim.z+threadIdx.z;
|
||||||
int i = ((blockIdx.x*gridDim.y+blockIdx.y)*gridDim.z + blockIdx.z) *
|
int i = (((blockIdx.x*gridDim.y+blockIdx.y)*gridDim.z + blockIdx.z) *
|
||||||
blockDim.x*blockDim.y*blockDim.z + i_offset;
|
blockDim.x*blockDim.y*blockDim.z + i_offset)%num_states_;
|
||||||
while(Kokkos::atomic_compare_exchange(&locks_(i),0,1)) {
|
while(Kokkos::atomic_compare_exchange(&locks_(i),0,1)) {
|
||||||
i+=blockDim.x*blockDim.y*blockDim.z;
|
i+=blockDim.x*blockDim.y*blockDim.z;
|
||||||
if(i>=num_states_) {i = i_offset;}
|
if(i>=num_states_) {i = i_offset;}
|
||||||
|
@ -1168,8 +1168,8 @@ KOKKOS_INLINE_FUNCTION
|
||||||
Random_XorShift1024<Kokkos::Cuda> Random_XorShift1024_Pool<Kokkos::Cuda>::get_state() const {
|
Random_XorShift1024<Kokkos::Cuda> Random_XorShift1024_Pool<Kokkos::Cuda>::get_state() const {
|
||||||
#ifdef __CUDA_ARCH__
|
#ifdef __CUDA_ARCH__
|
||||||
const int i_offset = (threadIdx.x*blockDim.y + threadIdx.y)*blockDim.z+threadIdx.z;
|
const int i_offset = (threadIdx.x*blockDim.y + threadIdx.y)*blockDim.z+threadIdx.z;
|
||||||
int i = ((blockIdx.x*gridDim.y+blockIdx.y)*gridDim.z + blockIdx.z) *
|
int i = (((blockIdx.x*gridDim.y+blockIdx.y)*gridDim.z + blockIdx.z) *
|
||||||
blockDim.x*blockDim.y*blockDim.z + i_offset;
|
blockDim.x*blockDim.y*blockDim.z + i_offset)%num_states_;
|
||||||
while(Kokkos::atomic_compare_exchange(&locks_(i),0,1)) {
|
while(Kokkos::atomic_compare_exchange(&locks_(i),0,1)) {
|
||||||
i+=blockDim.x*blockDim.y*blockDim.z;
|
i+=blockDim.x*blockDim.y*blockDim.z;
|
||||||
if(i>=num_states_) {i = i_offset;}
|
if(i>=num_states_) {i = i_offset;}
|
||||||
|
|
Loading…
Reference in New Issue