[FRONTEND] Make sure to hold the gil when creating python objects (#726)

Without this patch, a debug version of python complains that: ``` Fatal Python error: Python memory allocator called without holding the GIL Python runtime state: initialized ```
2022-09-29 21:06:22 -04:00
parent dad97528b2
commit f45e31ba7c
1 changed files with 40 additions and 35 deletions
--- a/python/src/triton.cc
+++ b/python/src/triton.cc
@@ -437,13 +437,16 @@ typedef std::map<std::string, py::object> asm_map_t;
 void init_triton_codegen(py::module &&m) {
  m.def("compile_ttir",
      [](backend_t backend, ir::module &ir, uint64_t device, int num_warps, int num_stages, py::dict& extern_libs, size_t cc) {
          py::gil_scoped_release allow_threads;
          std::string name = ir.get_function_list()[0]->get_name();
          // record asm as we generate
          asm_map_t asm_map;
          std::ostringstream ttir;
          int n_shared_bytes;
          std::string tmp;
          std::string ptx;
          std::string cubin;
          std::string name;
          { // Scope where the GIL is released
            py::gil_scoped_release allow_threads;
            name = ir.get_function_list()[0]->get_name();
            ir.print(ttir);
          asm_map["ttir"] = py::cast(ttir.str());
            llvm::LLVMContext ctx;
            // construct extern lib map
            triton::codegen::ExternLibMap extern_lib_map;
@@ -464,19 +467,21 @@ void init_triton_codegen(py::module &&m) {
            std::string ptxas_path = drv::path_to_ptxas(version);
            // Triton-IR -> NVPTX LLVM-IR
            triton::codegen::nvidia_cu_target target(cc);
          int n_shared_bytes;
            auto llvm = triton::codegen::add_passes_to_emit_bin(
                ir, ctx, &target, num_warps, num_stages, n_shared_bytes, extern_lib_map);
          std::string tmp;
            llvm::raw_string_ostream llir(tmp);
            llir << *llvm;
            llir.flush();
          asm_map["llir"] = py::cast(tmp);
            // LLVM-IR -> PTX
-          std::string ptx = drv::llir_to_ptx(llvm.get(), cc, version);
+            ptx = drv::llir_to_ptx(llvm.get(), cc, version);
          asm_map["ptx"] = py::cast(ptx);
            // PTX -> Binary
-          std::string cubin = drv::ptx_to_cubin(ptx, ptxas_path, cc);
+            cubin = drv::ptx_to_cubin(ptx, ptxas_path, cc);
          }
          asm_map_t asm_map;
          asm_map["ttir"] = py::cast(ttir.str());
          asm_map["llir"] = py::cast(tmp);
          asm_map["ptx"] = py::cast(ptx);
          if(!cubin.empty()){
            py::bytes bytes(cubin);
            asm_map["cubin"] = bytes;