Skip to content

Commit 4e4d8d3

Browse files
Fix falling back to SM90 tunings
1 parent a5e771e commit 4e4d8d3

File tree

1 file changed

+18
-32
lines changed

1 file changed

+18
-32
lines changed

cub/cub/device/dispatch/tuning/tuning_histogram.cuh

Lines changed: 18 additions & 32 deletions
Original file line number | Diff line number | Diff line change
@@ -151,23 +151,17 @@ struct sm100_tuning<1, SampleT, 1, 1, counter_size::_4, primitive_sample::yes, s
151 151
static constexpr int vec_size = 1 << 2;
152 152
};
153 153

154-
// same as base
155-
template <class SampleT>
156-
struct sm100_tuning<1, SampleT, 1, 1, counter_size::_4, primitive_sample::yes, sample_size::_2>
157-
: sm90_tuning<SampleT, 1, 1, counter_size::_4, primitive_sample::yes, sample_size::_2>
158-
{};
154+
// same as SM90
155+
// template <class SampleT>
156+
// struct sm100_tuning<1, SampleT, 1, 1, counter_size::_4, primitive_sample::yes, sample_size::_2> {};
159 157

160-
// same as base
161-
template <class SampleT>
162-
struct sm100_tuning<1, SampleT, 1, 1, counter_size::_4, primitive_sample::yes, sample_size::_4>
163-
: sm90_tuning<SampleT, 1, 1, counter_size::_4, primitive_sample::yes, sample_size::_4>
164-
{};
158+
// same as SM90
159+
// template <class SampleT>
160+
// struct sm100_tuning<1, SampleT, 1, 1, counter_size::_4, primitive_sample::yes, sample_size::_4> {};
165 161

166-
// same as base
167-
template <class SampleT>
168-
struct sm100_tuning<1, SampleT, 1, 1, counter_size::_4, primitive_sample::yes, sample_size::_8>
169-
: sm90_tuning<SampleT, 1, 1, counter_size::_4, primitive_sample::yes, sample_size::_8>
170-
{};
162+
// same as SM90
163+
// template <class SampleT>
164+
// struct sm100_tuning<1, SampleT, 1, 1, counter_size::_4, primitive_sample::yes, sample_size::_8> {};
171 165

172 166
// range
173 167
template <class SampleT>
@@ -184,11 +178,9 @@ struct sm100_tuning<0, SampleT, 1, 1, counter_size::_4, primitive_sample::yes, s
184 178
static constexpr int vec_size = 1 << 2;
185 179
};
186 180

187-
// same as base
188-
template <class SampleT>
189-
struct sm100_tuning<0, SampleT, 1, 1, counter_size::_4, primitive_sample::yes, sample_size::_2>
190-
: sm90_tuning<SampleT, 1, 1, counter_size::_4, primitive_sample::yes, sample_size::_2>
191-
{};
181+
// same as SM90
182+
// template <class SampleT>
183+
// struct sm100_tuning<0, SampleT, 1, 1, counter_size::_4, primitive_sample::yes, sample_size::_2> {};
192 184

193 185
template <class SampleT>
194 186
struct sm100_tuning<0, SampleT, 1, 1, counter_size::_4, primitive_sample::yes, sample_size::_4>
@@ -234,22 +226,16 @@ struct sm100_tuning<1, SampleT, 4, 3, counter_size::_4, primitive_sample::yes, s
234 226
};
235 227

236 228
// same as base
237-
template <class SampleT>
238-
struct sm100_tuning<1, SampleT, 4, 3, counter_size::_4, primitive_sample::yes, sample_size::_2>
239-
: sm90_tuning<SampleT, 1, 1, counter_size::_4, primitive_sample::yes, sample_size::_2>
240-
{};
229+
// template <class SampleT>
230+
// struct sm100_tuning<1, SampleT, 4, 3, counter_size::_4, primitive_sample::yes, sample_size::_2> {};
241 231

242 232
// same as base
243-
template <class SampleT>
244-
struct sm100_tuning<1, SampleT, 4, 3, counter_size::_4, primitive_sample::yes, sample_size::_4>
245-
: sm90_tuning<SampleT, 1, 1, counter_size::_4, primitive_sample::yes, sample_size::_4>
246-
{};
233+
// template <class SampleT>
234+
// struct sm100_tuning<1, SampleT, 4, 3, counter_size::_4, primitive_sample::yes, sample_size::_4> {};
247 235

248 236
// same as base
249-
template <class SampleT>
250-
struct sm100_tuning<1, SampleT, 4, 3, counter_size::_4, primitive_sample::yes, sample_size::_8>
251-
: sm90_tuning<SampleT, 1, 1, counter_size::_4, primitive_sample::yes, sample_size::_8>
252-
{};
237+
// template <class SampleT>
238+
// struct sm100_tuning<1, SampleT, 4, 3, counter_size::_4, primitive_sample::yes, sample_size::_8> {};
253 239

254 240
// multi.range
255 241
template <class SampleT>

0 commit comments

Comments
 (0)