Skip to content

Commit 2f03db7

Browse files
committed
static bdimx, unswitch persistent batch
1 parent 3521be6 commit 2f03db7

File tree

1 file changed

+3 -4 lines changed

1 file changed

+3 -4 lines changed

csrc/scheduler/reduction_utils.cpp

Lines changed: 3 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -200,15 +200,14 @@ TensorView* scheduleReductionTV(
200 200   if (rparams->static_bdimx) {
201 201   // [R, TIDx, Vect]
202 202   reduction_tv->split(inner_reduce_axis, rparams->lparams.bdimx());
203     - // [R, US, TIDx, Vect]
204     - outer_unswitch(inner_reduce_axis + 1);
205     - reduction_tv->axis(inner_reduce_axis + 2)
    203 + // [R, TIDx, Vect]
    204 + reduction_tv->axis(inner_reduce_axis + 1)
206 205   ->parallelize(rparams->block_dim_inner_reduction);
207 206   } else {
208 207   reduction_tv->split(
209 208   outer_i++, rparams->batches_per_block_inner_reduction, false);
210     - outer_unswitch(outer_i++);
211 209   }
    210 + outer_unswitch(outer_i++);
212 211
213 212   if (!rparams->vectorize_inner_reduction &&
214 213   rparams->unroll_factor_inner_reduction > 1) {

0 commit comments

Comments
 (0)