Skip to content

Commit

Permalink
Default F64, I32 workload for non_trivial_runs
Browse files Browse the repository at this point in the history
  • Loading branch information
gonidelis authored and bernhardmgruber committed Feb 5, 2025
1 parent 5a818e2 commit d21e758
Showing 1 changed file with 6 additions and 0 deletions.
6 changes: 6 additions & 0 deletions cub/cub/device/dispatch/tuning/tuning_run_length_encode.cuh
Original file line number Diff line number Diff line change
Expand Up @@ -569,6 +569,12 @@ struct sm100_tuning<LengthT, KeyT, primitive_length::yes, primitive_key::yes, le
using delay_constructor = detail::exponential_backoff_constructor_t<28, 520>;
};

// Primitive double keys (8 bytes) with primitive 4-byte lengths: explicitly reuse
// the SM90 tuning on SM100 by inheriting from the matching sm90_tuning
// specialization. Without this explicit fallback the workload regresses
// (NOTE(review): presumably relative to the generic SM100 tuning for 8-byte
// keys declared just above -- confirm against benchmark data).
template <typename LengthT>
struct sm100_tuning<LengthT, double, primitive_length::yes, primitive_key::yes, length_size::_4, key_size::_8>
    : sm90_tuning<LengthT, double, primitive_length::yes, primitive_key::yes, length_size::_4, key_size::_8>
{};

// TODO(gonidelis): Tune for I128.
#if CUB_IS_INT128_ENABLED
// template <class LengthT>
Expand Down

0 comments on commit d21e758

Please sign in to comment.