[Triton-MLIR][OPTIMIZER] Add ExtElemwiseOp to expensive_to_remat list
This commit is contained in:
@@ -200,7 +200,7 @@ inline bool expensive_to_remat(Operation *op) {
|
|||||||
return true;
|
return true;
|
||||||
if (isa<triton::gpu::ExtractSliceOp, triton::gpu::AllocTensorOp,
|
if (isa<triton::gpu::ExtractSliceOp, triton::gpu::AllocTensorOp,
|
||||||
triton::gpu::InsertSliceAsyncOp, triton::LoadOp, triton::StoreOp,
|
triton::gpu::InsertSliceAsyncOp, triton::LoadOp, triton::StoreOp,
|
||||||
triton::DotOp>(op))
|
triton::DotOp, triton::ExtElemwiseOp>(op))
|
||||||
return true;
|
return true;
|
||||||
if (isa<scf::YieldOp, scf::ForOp>(op))
|
if (isa<scf::YieldOp, scf::ForOp>(op))
|
||||||
return true;
|
return true;
|
||||||
@@ -623,4 +623,4 @@ public:
|
|||||||
|
|
||||||
std::unique_ptr<Pass> mlir::createTritonGPUCombineOpsPass() {
|
std::unique_ptr<Pass> mlir::createTritonGPUCombineOpsPass() {
|
||||||
return std::make_unique<TritonGPUCombineOpsPass>();
|
return std::make_unique<TritonGPUCombineOpsPass>();
|
||||||
}
|
}
|
||||||
|
Reference in New Issue
Block a user