[FRONTEND] Make triton.compile work without a cuda context (#708)

This allows compiling in a subprocess. I'm not seeing a ton of speedup from this, but I figure it is a good change anyway.
2022-09-24 13:41:47 -07:00
parent 3ac929b48b
commit 998fd5f9af
4 changed files with 53 additions and 14 deletions
--- a/lib/driver/llvm.cc
+++ b/lib/driver/llvm.cc
@@ -239,14 +239,12 @@ std::string ptx_to_cubin(const std::string& ptx, const std::string& ptxas, int c
    unlink(_flog);
    throw std::runtime_error("Internal Triton PTX codegen error: \n" + log);
  }
-  CUmodule ret;
  std::ifstream _cubin(_fbin, std::ios::binary );
  std::string cubin(std::istreambuf_iterator<char>(_cubin), {});
  _cubin.close();
  unlink(_fsrc);
  unlink(_flog);
  unlink(_fbin);
-  dispatch::cuModuleLoadData(&ret, cubin.c_str());
  return cubin;
 }