[BUILD] Remove compilation warnings

2021-03-24 01:24:50 -04:00
parent b352bc79e3
commit 5ba5a77561
6 changed files with 26 additions and 59 deletions
--- a/include/triton/runtime/function.h
+++ b/include/triton/runtime/function.h
@@ -92,12 +92,6 @@ void add_arg(std::stringstream& ss, T arg) {
 /* ------------------------- */
 /* ------------------------- */

-enum asm_mode_t {
-  ASM_LLIR,
-  ASM_NV_PTX,
-  ASM_NV_SASS
-};
-
 class kernel{
 public:
  typedef std::vector<size_t> grid_t;
@@ -111,7 +105,7 @@ public:
 public:
  kernel(const std::string& src, const options_t& opt, driver::device *device, const std::map<int, triton::ir::attribute> &attrs = {});
  void operator()(const std::string& args, driver::stream *stream, const grid_t& grid) const;
-  std::string get_asm(asm_mode_t mode);
+  std::string get_asm(const std::string &mode);

 public:
  const options_t opt;
--- a/lib/codegen/selection/generator.cc
+++ b/lib/codegen/selection/generator.cc
@@ -28,7 +28,7 @@ using namespace llvm;
 #define f16_ty               builder_->getHalfTy()
 #define f32_ty               builder_->getFloatTy()
 #define i32_ty               builder_->getInt32Ty()
-#define vec_ty(...)          VectorType::get(__VA_ARGS__)
+#define vec_ty(type, num_el) VectorType::get(type, num_el, false)
 #define ptr_ty(...)          PointerType::get(__VA_ARGS__)
 // constants
 #define i32(...)             builder_->getInt32(__VA_ARGS__)
--- a/lib/runtime/function.cc
+++ b/lib/runtime/function.cc
@@ -212,44 +212,23 @@ void kernel::operator()(const std::string& args, driver::stream *stream, const s
  stream->enqueue(&*ker_, grid, {(size_t)opt.num_warps * 32, 1, 1}, (void*)args.data(), args.size(), shared_mem_);
 }

-std::string kernel::get_asm(asm_mode_t mode) {
-  switch(mode){
-      case ASM_LLIR:{
-        return  ((driver::cu_module*)mod_.get())->llir();
-      }
-      case ASM_NV_PTX:
-      case ASM_NV_SASS:{
-        std::string ptx = ((driver::cu_module*)mod_.get())->ptx();
-        // SASS
-        std::string input = std::tmpnam(nullptr);
-        std::string output = std::tmpnam(nullptr);
-        std::ofstream ofs(input);
-        ofs << ptx;
-        ofs.close();
-        if(mode == ASM_NV_PTX)
-          return ptx;
-        std::string cmd;
-        int err;
-        // compile ptx
-        driver::cu_device* cu_device = (driver::cu_device*)dev_;
-        cmd = "ptxas --gpu-name=sm_" + std::to_string(cu_device->compute_capability()) + " " + input + " -o " + input + ".o";
-        err = system(cmd.c_str());
-        // disassemble
-        cmd = "cuobjdump --dump-sass " + input + ".o >> " + output;
-        err = system(cmd.c_str());
-        std::regex comment(" *\\/\\* 0x[0-9a-f]+ \\*\\/");
-        std::string to_delete = "                                                                                           /*";
-        std::ifstream ifs(output);
-        std::string line;
-        std::string sass;
-        while(std::getline(ifs, line))
-          if(!std::regex_match(line, comment))
-            sass += line + "\n";
-        return sass;
-      }
-      default:
-        return "";
+std::string kernel::get_asm(const std::string& mode) {
+  std::vector<std::string> modes = {"llir", "ptx"};
+  if(std::find(modes.begin(), modes.end(), mode) == modes.end()){
+    std::string err = "Unrecognized mode. Supported values are: ";
+    for(std::string m: modes){
+      if(m != modes[0])
+        err += ", ";
+      err += m;
    }
+    throw std::runtime_error(err);
+  }
+  if(mode == "llir")
+      return ((driver::cu_module*)mod_.get())->llir();
+  if(mode == "ptx")
+      return ((driver::cu_module*)mod_.get())->ptx();
+  assert(false);
+  return "";
 }
 /* --------------------------------- */
 /* --------------------------------- */
--- a/python/src/triton.cc
+++ b/python/src/triton.cc
@@ -127,10 +127,6 @@ void init_triton_runtime(py::module &&m) {
      .value("float", rt::FLOAT_T)
      .value("double", rt::DOUBLE_T)
      .value("buffer", rt::BUFFER_T);
-  // assembly mode
-  py::enum_<rt::asm_mode_t>(m, "asm_mode")
-      .value("ptx", rt::ASM_NV_PTX)
-      .value("sass", rt::ASM_NV_SASS);
  // compilation options
  py::class_<rt::options_t>(m, "options", py::dynamic_attr())
      .def(py::init<>())
@@ -142,7 +138,8 @@ void init_triton_runtime(py::module &&m) {
  //  kernel
  py::class_<rt::kernel>(m, "kernel")
      .def("__call__", &rt::kernel::operator())
-      .def_readonly("opt", &rt::kernel::opt);
+      .def_readonly("opt", &rt::kernel::opt)
+      .def("asm", &rt::kernel::get_asm);
  // tune conf
  py::class_<rt::config>(m, "config")
      .def(py::init<std::map<std::string, std::string>, int>(),
--- a/python/triton/kernel.py
+++ b/python/triton/kernel.py
@@ -6,14 +6,9 @@ import torch
 import triton._C.libtriton.triton as _triton

 codes = {
-    _triton.runtime.arg_type.int1: 'B',
-    _triton.runtime.arg_type.int8: 'B',
-    _triton.runtime.arg_type.int32: 'I',
-    _triton.runtime.arg_type.int64: 'Q',
-    _triton.runtime.arg_type.half: 'H',
-    _triton.runtime.arg_type.float: 'f',
-    _triton.runtime.arg_type.double: 'd',
-    _triton.runtime.arg_type.buffer: 'P'
+    _triton.runtime.arg_type.int1: 'B', _triton.runtime.arg_type.int8: 'B', _triton.runtime.arg_type.int32: 'I',
+    _triton.runtime.arg_type.int64: 'Q', _triton.runtime.arg_type.half: 'H', _triton.runtime.arg_type.float: 'f',
+    _triton.runtime.arg_type.double: 'd', _triton.runtime.arg_type.buffer: 'P'
 }


--- a/python/triton/testing.py
+++ b/python/triton/testing.py
@@ -3,8 +3,10 @@ import os

 try:
    import triton._C.libtriton.cutlass as _cutlass
+    has_cutlass = True
 except ImportError:
    _cutlass = None
+    has_cutlass = False


 def sparsify_tensor(x, mask, block):
@@ -44,7 +46,7 @@ def mask_tensor(x, mask, block, value=0):
    return ret


-def allclose(x, y):
+def allclose(x, y, tol=1e-2):
    assert x.dtype == y.dtype
    diff = abs(x - y)
    x_max = torch.max(x)