From 954296ed80ca885871a84fbba1373df6ef6ff0c6 Mon Sep 17 00:00:00 2001
From: psychocrypt <psychocryptHPC@gmail.com>
Date: Wed, 24 Oct 2018 09:57:55 +0200
Subject: [PATCH] NVIDIA: fix wrong number of threads

In the CUDA backend for monero we always start twice as many threads as needed.
Those threads are then removed after the AES matrix is copied to shared memory.
Nevertheless, it is the result of a copy-paste bug.

- start correct number of threads for `monero`
---
 xmrstak/backend/nvidia/nvcc_code/cuda_core.cu | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/xmrstak/backend/nvidia/nvcc_code/cuda_core.cu b/xmrstak/backend/nvidia/nvcc_code/cuda_core.cu
index 7742e74..fa7e093 100644
--- a/xmrstak/backend/nvidia/nvcc_code/cuda_core.cu
+++ b/xmrstak/backend/nvidia/nvcc_code/cuda_core.cu
@@ -734,7 +734,7 @@ void cryptonight_core_gpu_hash(nvid_ctx* ctx, uint32_t nonce)
 {
 	dim3 grid( ctx->device_blocks );
 	dim3 block( ctx->device_threads );
-	dim3 block2( ctx->device_threads << 2 );
+	dim3 block2( ctx->device_threads << 1 );
 	dim3 block4( ctx->device_threads << 2 );
 	dim3 block8( ctx->device_threads << 3 );
 
-- 
GitLab