diff --git a/benchmarks/bench/partition/flagged.cu b/benchmarks/bench/partition/flagged.cu index 7c855c831..185564048 100644 --- a/benchmarks/bench/partition/flagged.cu +++ b/benchmarks/bench/partition/flagged.cu @@ -34,7 +34,7 @@ // %RANGE% TUNE_ITEMS_PER_THREAD ipt 7:24:1 // %RANGE% TUNE_THREADS_PER_BLOCK tpb 128:1024:32 // %RANGE% TUNE_MAGIC_NS ns 0:2048:4 -// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:6:1 +// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:7:1 // %RANGE% TUNE_L2_WRITE_LATENCY_NS l2w 0:1200:5 constexpr bool keep_rejects = true; diff --git a/benchmarks/bench/partition/if.cu b/benchmarks/bench/partition/if.cu index 55b59c91d..d28dfdc92 100644 --- a/benchmarks/bench/partition/if.cu +++ b/benchmarks/bench/partition/if.cu @@ -34,7 +34,7 @@ // %RANGE% TUNE_ITEMS_PER_THREAD ipt 7:24:1 // %RANGE% TUNE_THREADS_PER_BLOCK tpb 128:1024:32 // %RANGE% TUNE_MAGIC_NS ns 0:2048:4 -// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:6:1 +// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:7:1 // %RANGE% TUNE_L2_WRITE_LATENCY_NS l2w 0:1200:5 constexpr bool keep_rejects = true; diff --git a/benchmarks/bench/reduce/by_key.cu b/benchmarks/bench/reduce/by_key.cu index d6daedd81..7e466487e 100644 --- a/benchmarks/bench/reduce/by_key.cu +++ b/benchmarks/bench/reduce/by_key.cu @@ -34,7 +34,7 @@ // %RANGE% TUNE_TRANSPOSE trp 0:1:1 // %RANGE% TUNE_LOAD ld 0:1:1 // %RANGE% TUNE_MAGIC_NS ns 0:2048:4 -// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:6:1 +// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:7:1 // %RANGE% TUNE_L2_WRITE_LATENCY_NS l2w 0:1200:5 #if !TUNE_BASE diff --git a/benchmarks/bench/run_length_encode/encode.cu b/benchmarks/bench/run_length_encode/encode.cu index a0c10aca7..286c1da8c 100644 --- a/benchmarks/bench/run_length_encode/encode.cu +++ b/benchmarks/bench/run_length_encode/encode.cu @@ -34,7 +34,7 @@ // %RANGE% TUNE_TRANSPOSE trp 0:1:1 // %RANGE% TUNE_LOAD ld 0:1:1 // %RANGE% TUNE_MAGIC_NS ns 0:2048:4 -// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:6:1 +// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:7:1 // %RANGE% TUNE_L2_WRITE_LATENCY_NS l2w 0:1200:5 #if !TUNE_BASE diff --git a/benchmarks/bench/run_length_encode/non_trivial_runs.cu b/benchmarks/bench/run_length_encode/non_trivial_runs.cu index ae4441f94..a0c17e78e 100644 --- a/benchmarks/bench/run_length_encode/non_trivial_runs.cu +++ b/benchmarks/bench/run_length_encode/non_trivial_runs.cu @@ -35,7 +35,7 @@ // %RANGE% TUNE_TIME_SLICING ts 0:1:1 // %RANGE% TUNE_LOAD ld 0:1:1 // %RANGE% TUNE_MAGIC_NS ns 0:2048:4 -// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:6:1 +// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:7:1 // %RANGE% TUNE_L2_WRITE_LATENCY_NS l2w 0:1200:5 #if !TUNE_BASE diff --git a/benchmarks/bench/scan/exclusive/by_key.cu b/benchmarks/bench/scan/exclusive/by_key.cu index 818b02797..e8743f1f8 100644 --- a/benchmarks/bench/scan/exclusive/by_key.cu +++ b/benchmarks/bench/scan/exclusive/by_key.cu @@ -32,7 +32,7 @@ // %RANGE% TUNE_ITEMS ipt 7:24:1 // %RANGE% TUNE_THREADS tpb 128:1024:32 // %RANGE% TUNE_MAGIC_NS ns 0:2048:4 -// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:6:1 +// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:7:1 // %RANGE% TUNE_L2_WRITE_LATENCY_NS l2w 0:1200:5 // %RANGE% TUNE_TRANSPOSE trp 0:1:1 // %RANGE% TUNE_LOAD ld 0:2:1 diff --git a/benchmarks/bench/scan/exclusive/max.cu b/benchmarks/bench/scan/exclusive/max.cu index b7e8bec17..599a0f3b4 100644 --- a/benchmarks/bench/scan/exclusive/max.cu +++ b/benchmarks/bench/scan/exclusive/max.cu @@ -28,7 +28,7 @@ // %RANGE% TUNE_ITEMS ipt 7:24:1 // %RANGE% TUNE_THREADS tpb 128:1024:32 // %RANGE% TUNE_MAGIC_NS ns 0:2048:4 -// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:6:1 +// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:7:1 // %RANGE% TUNE_L2_WRITE_LATENCY_NS l2w 0:1200:5 // %RANGE% TUNE_TRANSPOSE trp 0:1:1 // %RANGE% TUNE_LOAD ld 0:2:1 diff --git a/benchmarks/bench/scan/exclusive/sum.cu b/benchmarks/bench/scan/exclusive/sum.cu index d0f824f1c..ca8bfe469 100644 --- a/benchmarks/bench/scan/exclusive/sum.cu +++ b/benchmarks/bench/scan/exclusive/sum.cu @@ -30,7 +30,7 @@ // %RANGE% TUNE_ITEMS ipt 7:24:1 // %RANGE% TUNE_THREADS tpb 128:1024:32 // %RANGE% TUNE_MAGIC_NS ns 0:2048:4 -// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:6:1 +// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:7:1 // %RANGE% TUNE_L2_WRITE_LATENCY_NS l2w 0:1200:5 // %RANGE% TUNE_TRANSPOSE trp 0:1:1 // %RANGE% TUNE_LOAD ld 0:2:1 diff --git a/benchmarks/bench/select/flagged.cu b/benchmarks/bench/select/flagged.cu index 9e4fa47d4..dc59450be 100644 --- a/benchmarks/bench/select/flagged.cu +++ b/benchmarks/bench/select/flagged.cu @@ -35,7 +35,7 @@ // %RANGE% TUNE_ITEMS_PER_THREAD ipt 7:24:1 // %RANGE% TUNE_THREADS_PER_BLOCK tpb 128:1024:32 // %RANGE% TUNE_MAGIC_NS ns 0:2048:4 -// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:6:1 +// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:7:1 // %RANGE% TUNE_L2_WRITE_LATENCY_NS l2w 0:1200:5 constexpr bool keep_rejects = false; diff --git a/benchmarks/bench/select/if.cu b/benchmarks/bench/select/if.cu index 5eee9cb1a..42bbe028c 100644 --- a/benchmarks/bench/select/if.cu +++ b/benchmarks/bench/select/if.cu @@ -36,7 +36,7 @@ // %RANGE% TUNE_ITEMS_PER_THREAD ipt 7:24:1 // %RANGE% TUNE_THREADS_PER_BLOCK tpb 128:1024:32 // %RANGE% TUNE_MAGIC_NS ns 0:2048:4 -// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:6:1 +// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:7:1 // %RANGE% TUNE_L2_WRITE_LATENCY_NS l2w 0:1200:5 constexpr bool keep_rejects = false; diff --git a/benchmarks/bench/select/unique_by_key.cu b/benchmarks/bench/select/unique_by_key.cu index 11a52b655..80ca4aea9 100644 --- a/benchmarks/bench/select/unique_by_key.cu +++ b/benchmarks/bench/select/unique_by_key.cu @@ -34,7 +34,7 @@ // %RANGE% TUNE_TRANSPOSE trp 0:1:1 // %RANGE% TUNE_LOAD ld 0:1:1 // %RANGE% TUNE_MAGIC_NS ns 0:2048:4 -// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:6:1 +// %RANGE% TUNE_DELAY_CONSTRUCTOR_ID dcid 0:7:1 // %RANGE% TUNE_L2_WRITE_LATENCY_NS l2w 0:1200:5 #if !TUNE_BASE diff --git a/benchmarks/nvbench_helper/look_back_helper.cuh b/benchmarks/nvbench_helper/look_back_helper.cuh index 670a4b056..b1836afe7 100644 --- a/benchmarks/nvbench_helper/look_back_helper.cuh +++ b/benchmarks/nvbench_helper/look_back_helper.cuh @@ -36,6 +36,7 @@ #endif using delay_constructors = nvbench::type_list< + cub::detail::no_delay_constructor_t, cub::detail::fixed_delay_constructor_t, cub::detail::exponential_backoff_constructor_t, cub::detail::exponential_backoff_jitter_constructor_t,