Skip to content

Commit c8e90bb

Browse files
committed
At this problem size (16x16 FFT), cudaDeviceSynchronize() is almost as expensive as an FFT itself. Let's not include the device synchronize in the timed region, since cuFFT clearly is blocking here anyway.
1 parent 86eafe2 commit c8e90bb

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

Diff for: cufft_multiple_streams/main.cu

+1-1
Original file line numberDiff line numberDiff line change
@@ -41,7 +41,7 @@ void cufftForward_streams_experiment(){
4141
for(int i=0; i<number_of_FFTs; i++){
4242
CHECK_CUFFT(cufftExecR2C(forwardPlan[i], d_in[i], d_freq[i]));
4343
}
44-
CHECK_CUDART(cudaDeviceSynchronize());
44+
//CHECK_CUDART(cudaDeviceSynchronize());
4545
double forwardTime = read_timer() - start;
4646
printf("time for %d forward FFTs in streams = %f \n", number_of_FFTs, forwardTime);
4747
printf("avg time per FFT = %f \n", forwardTime/number_of_FFTs);

0 commit comments

Comments
 (0)