Skip to content

Commit

Permalink
Reduce register pressure
Browse files: browse the repository at this point in the history
  • Loading branch information
vmarkovtsev committed Nov 10, 2016
1 parent fc3374d commit 19bc74d
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions kernel.cu
Original file line number Diff line number Diff line change
Expand Up @@ -42,8 +42,8 @@ __global__ void weighted_minhash_cuda(
const uint32_t sample_offset = sample_index * sample_delta;
const uint32_t samples = blockDim.x * sample_delta;
extern __shared__ float shmem[];
- float *lnmins = &shmem[(threadIdx.y * blockDim.x + sample_index) * 3 * sample_delta];
- uint2 *dtmins = reinterpret_cast<uint2 *>(lnmins + sample_delta);
+ float *volatile lnmins = &shmem[(threadIdx.y * blockDim.x + sample_index) * 3 * sample_delta];
+ uint2 *volatile dtmins = reinterpret_cast<uint2 *>(lnmins + sample_delta);
int32_t row = -1;
for (uint32_t index = 0, border = 0;; index++) {
if (index >= border) {
Expand Down

0 comments on commit 19bc74d

Please sign in to comment.