From 2afa84d4ca0f8abb18cc06d8fb8f2013f289a8d6 Mon Sep 17 00:00:00 2001 From: Georgy Evtushenko Date: Sat, 13 May 2023 11:14:51 +0400 Subject: [PATCH] Tune radix sort keys for U8/U16 and 64-bit offsets --- cub/device/dispatch/dispatch_radix_sort.cuh | 2 ++ 1 file changed, 2 insertions(+) diff --git a/cub/device/dispatch/dispatch_radix_sort.cuh b/cub/device/dispatch/dispatch_radix_sort.cuh index d4fb19658..56da93992 100644 --- a/cub/device/dispatch/dispatch_radix_sort.cuh +++ b/cub/device/dispatch/dispatch_radix_sort.cuh @@ -629,7 +629,9 @@ struct sm90_small_key_tuning // keys template <> struct sm90_small_key_tuning<1, 0, 4> { static constexpr int threads = 512; static constexpr int items = 19; }; +template <> struct sm90_small_key_tuning<1, 0, 8> { static constexpr int threads = 512; static constexpr int items = 19; }; template <> struct sm90_small_key_tuning<2, 0, 4> { static constexpr int threads = 512; static constexpr int items = 19; }; +template <> struct sm90_small_key_tuning<2, 0, 8> { static constexpr int threads = 512; static constexpr int items = 19; }; // pairs 8:xx template <> struct sm90_small_key_tuning<1, 1, 4> { static constexpr int threads = 512; static constexpr int items = 15; };