From 8b85f602f74b7993c6f45fc6e4bfb5bda319b6ed Mon Sep 17 00:00:00 2001
From: Tobias Winchen <tobias.winchen@rwth-aachen.de>
Date: Tue, 5 Mar 2019 13:14:40 +0000
Subject: [PATCH] Remove stream synchronization from methods to allow memcpy/kernel overlap

---
 psrdada_cpp/effelsberg/edd/src/DetectorAccumulator.cu | 1 -
 psrdada_cpp/effelsberg/edd/src/Unpacker.cu            | 2 --
 2 files changed, 3 deletions(-)

diff --git a/psrdada_cpp/effelsberg/edd/src/DetectorAccumulator.cu b/psrdada_cpp/effelsberg/edd/src/DetectorAccumulator.cu
index e4c1b08f..527bfb95 100644
--- a/psrdada_cpp/effelsberg/edd/src/DetectorAccumulator.cu
+++ b/psrdada_cpp/effelsberg/edd/src/DetectorAccumulator.cu
@@ -57,7 +57,6 @@ void DetectorAccumulator::detect(InputType const& input, OutputType& output)
     int8_t* output_ptr = thrust::raw_pointer_cast(output.data());
     kernels::detect_and_accumulate<<<1024, 1024, 0, _stream>>>(
         input_ptr, output_ptr, _nchans, nsamps, _tscrunch, _scale, _offset);
-    CUDA_ERROR_CHECK(cudaStreamSynchronize(_stream));
 }
 
 } //namespace edd
diff --git a/psrdada_cpp/effelsberg/edd/src/Unpacker.cu b/psrdada_cpp/effelsberg/edd/src/Unpacker.cu
index 35065838..11c0ac7b 100644
--- a/psrdada_cpp/effelsberg/edd/src/Unpacker.cu
+++ b/psrdada_cpp/effelsberg/edd/src/Unpacker.cu
@@ -133,7 +133,6 @@ void Unpacker::unpack<12>(InputType const& input, OutputType& output)
     OutputType::value_type* output_ptr = thrust::raw_pointer_cast(output.data());
     kernels::unpack_edd_12bit_to_float32<<< nblocks, EDD_NTHREADS_UNPACK, 0, _stream>>>(
         input_ptr, output_ptr, input.size());
-    CUDA_ERROR_CHECK(cudaStreamSynchronize(_stream));
 }
 
 template <>
@@ -148,7 +147,6 @@ void Unpacker::unpack<8>(InputType const& input, OutputType& output)
     OutputType::value_type* output_ptr = thrust::raw_pointer_cast(output.data());
     kernels::unpack_edd_8bit_to_float32<<< nblocks, EDD_NTHREADS_UNPACK, 0, _stream>>>(
         input_ptr, output_ptr, input.size());
-    CUDA_ERROR_CHECK(cudaStreamSynchronize(_stream));
 }
 
 } //namespace edd
-- 
GitLab