Skip to content

Commit bd2d2b8

Browse files
committed
revert
1 parent 4ac62bb commit bd2d2b8

2 files changed

Lines changed: 0 additions & 19 deletions

File tree

csrc/alias_analysis.cpp

Lines changed: 0 additions & 12 deletions
Original file line number | Diff line number | Diff line change
@@ -288,25 +288,13 @@ void AliasFinder::handle(const SliceOp* slice) {
288288
out, in, Layout(std::move(out_allocation), std::move(out_contiguity)));
289289
}
290290

291-
// Only consider broadcast aliasing when IO tensor is involved.
292-
// Intermediate broadcasts will be fused with other ops and don't need explicit
293-
// alias handling. Limiting to fusion boundaries avoids unnecessary allocation
294-
// domain changes on intermediate tensors, which may trigger transpose scheduler
295-
// when pointwise is preferred. For example, when a normalization kernel is
296-
// segmented, we prefer reduction + pointwise instead of reduction + transpose.
297-
// See SmemPersistentNotSupportedIn3DReduction.
298291
void AliasFinder::handle(const BroadcastOp* bcast) {
299292
auto* in = dynamic_cast<TensorView*>(bcast->in());
300293
if (in == nullptr) {
301294
return;
302295
}
303296
auto* out = bcast->out()->as<TensorView>();
304297

305-
// No alias analysis needed if no IO tensors are involved
306-
if (!out->isFusionOutput() && !in->isFusionInput()) {
307-
return;
308-
}
309-
310298
std::optional<Layout> out_layout =
311299
mapInLayoutToOutRoot(analysis_.preferredLayout(in), in, out);
312300
if (!out_layout.has_value()) {

tests/cpp/test_persistent_buffer.cpp

Lines changed: 0 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -1257,13 +1257,6 @@ TEST_F(PersistentBufferTest, SmemPersistentNotSupportedIn3DReduction) {
12571257
// persistent is not supported yet for 3D reduction.
12581258
EXPECT_TRUE(executor_cache.getMostRecentKernelRuntime()->isSegmented());
12591259

1260-
// expect reduction and pointwise scheduler
1261-
EXPECT_THAT(
1262-
executor_cache.getMostRecentKernelRuntime()->fusionSegments()->groups(),
1263-
UnorderedElementsAre(
1264-
HeuristicIs(SchedulerType::PointWise),
1265-
HeuristicIs(SchedulerType::Reduction)));
1266-
12671260
testValidate(executor_cache.fusion(), cg_outputs, {t0}, __LINE__, __FILE__);
12681261
}
12691262

0 commit comments

Comments
 (0)