summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorpsychocrypt <psychocrypt@users.noreply.github.com>2017-11-23 21:25:25 +0100
committerpsychocrypt <psychocrypt@users.noreply.github.com>2017-11-23 21:25:25 +0100
commit43812b36d763259216b288c62ea343e131510244 (patch)
tree50d5c30b0838e2cbc141da2305af64bc4cfb5850
parentfb6baa5d46cfa3d5e2b835544ea83e736b6903e4 (diff)
downloadxmr-stak-43812b36d763259216b288c62ea343e131510244.zip
xmr-stak-43812b36d763259216b288c62ea343e131510244.tar.gz
fix CUDA launch bounds usage
fix #191 lauch bounds must be placed before the return type but after the template paramater
-rw-r--r--xmrstak/backend/nvidia/nvcc_code/cuda_core.cu2
1 files changed, 1 insertions, 1 deletions
diff --git a/xmrstak/backend/nvidia/nvcc_code/cuda_core.cu b/xmrstak/backend/nvidia/nvcc_code/cuda_core.cu
index a92fa8c..dba6676 100644
--- a/xmrstak/backend/nvidia/nvcc_code/cuda_core.cu
+++ b/xmrstak/backend/nvidia/nvcc_code/cuda_core.cu
@@ -167,10 +167,10 @@ __forceinline__ __device__ uint32_t shuffle(volatile uint32_t* ptr,const uint32_
#endif
}
+template<size_t ITERATIONS, uint32_t THREAD_SHIFT, uint32_t MASK>
#ifdef XMR_STAK_THREADS
__launch_bounds__( XMR_STAK_THREADS * 4 )
#endif
-template<size_t ITERATIONS, uint32_t THREAD_SHIFT, uint32_t MASK>
__global__ void cryptonight_core_gpu_phase2( int threads, int bfactor, int partidx, uint32_t * d_long_state, uint32_t * d_ctx_a, uint32_t * d_ctx_b )
{
__shared__ uint32_t sharedMemory[1024];
OpenPOWER on IntegriCloud