[Triton-MLIR][BACKEND] Pass compute capability from the frontend and code cleanup (#961)

2022-12-07 15:03:46 -08:00
parent 4eab9dcedf
commit 18e683d9bb
4 changed files with 17 additions and 20 deletions
--- a/include/triton/Dialect/TritonGPU/IR/TritonGPUOps.td
+++ b/include/triton/Dialect/TritonGPU/IR/TritonGPUOps.td
@@ -32,6 +32,12 @@ def TTG_AsyncWaitOp : TTG_Op<"async_wait"> {
  let arguments = (ins I32Attr:$num);

  let assemblyFormat = "attr-dict";
+
+  let extraClassDeclaration = [{
+    static bool isSupported(int computeCapability) { // true iff computeCapability is at least 80
+      return computeCapability >= 80; // NOTE(review): 80 presumably denotes sm_80 — confirm with callers
+    }
+  }];
 }

 // Port Arith_CmpIOp & Arith_CmpFOp & Std_SelectOp to TritonGPU.
@@ -152,7 +158,13 @@ def TTG_InsertSliceAsyncOp : TTG_Op<"insert_slice_async",
  //}];

  let extraClassDeclaration = [{
-      static DenseSet<unsigned> getEligibleLoadByteWidth(int computeCapability);
+    static DenseSet<unsigned> getEligibleLoadByteWidth(int computeCapability) { // returns the set of eligible load byte widths for computeCapability
+      DenseSet<unsigned> validLoadBytes; // returned empty when computeCapability is below 80
+      if (computeCapability >= 80) {
+        validLoadBytes = {4, 8, 16}; // NOTE(review): presumably the copy sizes allowed by PTX cp.async — confirm
+      }
+      return validLoadBytes;
+    }
  }];

  // The custom parser could be replaced with oilist in LLVM-16