[BACKEND] Port the legacy heuristic rule for assigning the shared layout to A/B of MMAv1 (#948)

This commit is contained in:
goostavz
2022-12-06 03:30:23 +08:00
committed by GitHub
parent 99c7e0e008
commit e057c65cf0
2 changed files with 8 additions and 6 deletions

View File

@@ -3035,7 +3035,6 @@ void ConvertLayoutOpConversion::processReplica(
currVal = zext(llvmElemTy, currVal);
else if (isPtr)
currVal = ptrtoint(llvmElemTy, currVal);
valVec = insert_element(vecTy, valVec, currVal, idx_val(v));
}
store(valVec, ptr);
@@ -3143,7 +3142,6 @@ LogicalResult ConvertLayoutOpConversion::lowerBlockedToShared(
triton::gpu::ConvertLayoutOp op, OpAdaptor adaptor,
ConversionPatternRewriter &rewriter) const {
auto loc = op.getLoc();
Value src = op.src();
Value dst = op.result();
auto srcTy = src.getType().cast<RankedTensorType>();