Permalink
Browse files

A little bit more speed for Sia: make `start` const in siakernel and retune npt (128 → 1) and blocksize (256 → 320)

  • Loading branch information...
1 parent dc1e25e commit 09b7388b3ab1ba1293b3810842ce084c577052ed @KlausT committed Oct 27, 2016
Showing 2 changed files with 4 additions and 3 deletions.
  1. +1 −1 Sia/cuda_sia.cu
  2. +3 −2 Sia/sia.h
View
@@ -54,7 +54,7 @@ __device__ unsigned int numberofresults;
__global__ void __launch_bounds__(blocksize, 3) siakernel(uint32_t * __restrict__ nonceOut, uint64_t target, uint64_t startnonce)
{
uint64_t v[16];
- uint64_t start = startnonce + (blockDim.x * blockIdx.x + threadIdx.x)*npt;
+ const uint64_t start = startnonce + (blockDim.x * blockIdx.x + threadIdx.x)*npt;
numberofresults = 0;
View
@@ -1,8 +1,9 @@
#pragma once
#define MAXRESULTS 8
-#define npt 128
-#define blocksize 256
+
+#define npt 1
+#define blocksize 320
void sia_gpu_init(int thr_id);
void sia_precalc(cudaStream_t cudastream, const uint64_t *blockHeader);

0 comments on commit 09b7388

Please sign in to comment.