diff --git a/cuda/CudaPlotPhase3Step3.cu b/cuda/CudaPlotPhase3Step3.cu index c771eb67..c24c42f5 100644 --- a/cuda/CudaPlotPhase3Step3.cu +++ b/cuda/CudaPlotPhase3Step3.cu @@ -277,8 +277,8 @@ void CudaK32PlotPhase3Step3( CudaK32PlotContext& cx ) s3.parksOut.Reset(); // Copy map slice counts (for the next step 2) - CudaErrCheck( cudaMemcpyAsync( cx.hostBucketSlices, cx.devSliceCounts, sizeof( uint32 , 51) * BBCU_BUCKET_COUNT * BBCU_BUCKET_COUNT, - cudaMemcpyDeviceToHost, downloadStream ) ); + CudaErrCheck( cudaMemcpyAsync( cx.hostBucketSlices, cx.devSliceCounts, sizeof( uint32) * BBCU_BUCKET_COUNT * BBCU_BUCKET_COUNT, + cudaMemcpyDeviceToHost, downloadStream ) , 51); CudaErrCheck( cudaStreamSynchronize( downloadStream ) , 52); memcpy( &s3.prunedBucketSlices[0][0], cx.hostBucketSlices, sizeof( uint32 ) * BBCU_BUCKET_COUNT * BBCU_BUCKET_COUNT ); diff --git a/cuda/chacha8.cu b/cuda/chacha8.cu index 0ebead78..61d79a11 100644 --- a/cuda/chacha8.cu +++ b/cuda/chacha8.cu @@ -229,7 +229,7 @@ void GenF1Cuda( CudaK32PlotContext& cx ) } // Copy bucket slices to host - CudaErrCheck( cudaMemcpyAsync( cx.hostBucketSlices, cx.devSliceCounts, sizeof( uint32 , 100) * BBCU_BUCKET_COUNT * BBCU_BUCKET_COUNT, + CudaErrCheck( cudaMemcpyAsync( cx.hostBucketSlices, cx.devSliceCounts, sizeof( uint32) * BBCU_BUCKET_COUNT * BBCU_BUCKET_COUNT, cudaMemcpyDeviceToHost, cx.computeStream ), 999 ); CudaErrCheck( cudaStreamSynchronize( cx.computeStream ) , 101);