@@ -277,7 +277,7 @@ struct AgentRadixSortDownsweep
277277 temp_storage.keys_and_offsets .exchange_keys [ranks[ITEM]] = twiddled_keys[ITEM];
278278 }
279279
280- CTA_SYNC ();
280+ __syncthreads ();
281281
282282#pragma unroll
283283 for (int ITEM = 0 ; ITEM < ITEMS_PER_THREAD; ++ITEM)
@@ -305,7 +305,7 @@ struct AgentRadixSortDownsweep
305305 int (&ranks)[ITEMS_PER_THREAD],
306306 OffsetT valid_items)
307307 {
308- CTA_SYNC ();
308+ __syncthreads ();
309309
310310 ValueExchangeT& exchange_values = temp_storage.exchange_values .Alias ();
311311
@@ -315,7 +315,7 @@ struct AgentRadixSortDownsweep
315315 exchange_values[ranks[ITEM]] = values[ITEM];
316316 }
317317
318- CTA_SYNC ();
318+ __syncthreads ();
319319
320320#pragma unroll
321321 for (int ITEM = 0 ; ITEM < ITEMS_PER_THREAD; ++ITEM)
@@ -342,7 +342,7 @@ struct AgentRadixSortDownsweep
342342 {
343343 BlockLoadKeysT (temp_storage.load_keys ).Load (d_keys_in + block_offset, keys);
344344
345- CTA_SYNC ();
345+ __syncthreads ();
346346 }
347347
348348 /* *
@@ -362,7 +362,7 @@ struct AgentRadixSortDownsweep
362362
363363 BlockLoadKeysT (temp_storage.load_keys ).Load (d_keys_in + block_offset, keys, valid_items, oob_item);
364364
365- CTA_SYNC ();
365+ __syncthreads ();
366366 }
367367
368368 /* *
@@ -409,7 +409,7 @@ struct AgentRadixSortDownsweep
409409 {
410410 BlockLoadValuesT (temp_storage.load_values ).Load (d_values_in + block_offset, values);
411411
412- CTA_SYNC ();
412+ __syncthreads ();
413413 }
414414
415415 /* *
@@ -428,7 +428,7 @@ struct AgentRadixSortDownsweep
428428
429429 BlockLoadValuesT (temp_storage.load_values ).Load (d_values_in + block_offset, values, valid_items);
430430
431- CTA_SYNC ();
431+ __syncthreads ();
432432 }
433433
434434 /* *
@@ -474,7 +474,7 @@ struct AgentRadixSortDownsweep
474474 {
475475 ValueT values[ITEMS_PER_THREAD];
476476
477- CTA_SYNC ();
477+ __syncthreads ();
478478
479479 LoadValues (values, block_offset, valid_items, Int2Type<FULL_TILE>(), Int2Type<LOAD_WARP_STRIPED>());
480480
@@ -520,7 +520,7 @@ struct AgentRadixSortDownsweep
520520 int exclusive_digit_prefix[BINS_TRACKED_PER_THREAD];
521521 BlockRadixRankT (temp_storage.radix_rank ).RankKeys (keys, ranks, digit_extractor (), exclusive_digit_prefix);
522522
523- CTA_SYNC ();
523+ __syncthreads ();
524524
525525// Share exclusive digit prefix
526526#pragma unroll
@@ -534,7 +534,7 @@ struct AgentRadixSortDownsweep
534534 }
535535 }
536536
537- CTA_SYNC ();
537+ __syncthreads ();
538538
539539 // Get inclusive digit prefix
540540 int inclusive_digit_prefix[BINS_TRACKED_PER_THREAD];
@@ -562,7 +562,7 @@ struct AgentRadixSortDownsweep
562562 }
563563 }
564564
565- CTA_SYNC ();
565+ __syncthreads ();
566566
567567// Update global scatter base offsets for each digit
568568#pragma unroll
@@ -577,7 +577,7 @@ struct AgentRadixSortDownsweep
577577 }
578578 }
579579
580- CTA_SYNC ();
580+ __syncthreads ();
581581
582582 // Scatter keys
583583 ScatterKeys<FULL_TILE>(keys, relative_bin_offsets, ranks, valid_items);
@@ -602,7 +602,7 @@ struct AgentRadixSortDownsweep
602602 T items[ITEMS_PER_THREAD];
603603
604604 LoadDirectStriped<BLOCK_THREADS>(threadIdx .x , d_in + block_offset, items);
605- CTA_SYNC ();
605+ __syncthreads ();
606606 StoreDirectStriped<BLOCK_THREADS>(threadIdx .x , d_out + block_offset, items);
607607
608608 block_offset += TILE_ITEMS;
@@ -616,7 +616,7 @@ struct AgentRadixSortDownsweep
616616 T items[ITEMS_PER_THREAD];
617617
618618 LoadDirectStriped<BLOCK_THREADS>(threadIdx .x , d_in + block_offset, items, valid_items);
619- CTA_SYNC ();
619+ __syncthreads ();
620620 StoreDirectStriped<BLOCK_THREADS>(threadIdx .x , d_out + block_offset, items, valid_items);
621621 }
622622 }
@@ -670,7 +670,7 @@ struct AgentRadixSortDownsweep
670670 }
671671 }
672672
673- short_circuit = CTA_SYNC_AND (short_circuit);
673+ short_circuit = __syncthreads_and (short_circuit);
674674 }
675675
676676 /* *
@@ -719,7 +719,7 @@ struct AgentRadixSortDownsweep
719719 }
720720 }
721721
722- short_circuit = CTA_SYNC_AND (short_circuit);
722+ short_circuit = __syncthreads_and (short_circuit);
723723 }
724724
725725 /* *
@@ -744,7 +744,7 @@ struct AgentRadixSortDownsweep
744744 ProcessTile<true >(block_offset);
745745 block_offset += TILE_ITEMS;
746746
747- CTA_SYNC ();
747+ __syncthreads ();
748748 }
749749
750750 // Clean up last partial tile with guarded-I/O
0 commit comments