From a7f414caecaed7da76bcf7c53cd17a0b07c06f17 Mon Sep 17 00:00:00 2001
From: Soeren Schoenbrod
Date: Fri, 19 May 2023 21:59:26 +0200
Subject: [PATCH] Only start num_samples_left threads instead of size(signal, 1)

---
 src/gpu_downconvert_and_correlate.jl | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/gpu_downconvert_and_correlate.jl b/src/gpu_downconvert_and_correlate.jl
index 49e51d7..e2ac8ba 100644
--- a/src/gpu_downconvert_and_correlate.jl
+++ b/src/gpu_downconvert_and_correlate.jl
@@ -170,8 +170,8 @@ function downconvert_and_correlate!(
 ) where M
     # Assume 1024 to be the max number of threads
     # TODO: Evaluate this at run time
-    threads = min(size(signal, 1), 1024)
-    blocks = cld(size(signal, 1), threads)
+    threads = min(num_samples_left, 1024)
+    blocks = cld(num_samples_left, threads)
     num_correlators = size(downconverted_and_decoded_signal, 3)
     @cuda threads=threads blocks=blocks downconvert_and_decode_prn_kernel!(
         downconverted_and_decoded_signal,