This PR does the following: - Stops compiling CUDA utilities (e.g., cuGetInfo) as part of libtriton.so. - Refactors driver/llvm.cc, splitting its functionality between PTX codegen and Python. - By extension, deprecates include/external, so Triton no longer has to carry copies of some CUDA/HIP headers. - Turns `triton-translate` into a `triton.tools.aot` Python utility that reuses functions from the triton.compile sub-module.
17 lines
435 B
MLIR
17 lines
435 B
MLIR
// RUN: python3 -m triton.tools.aot %s --target=llvm-ir | FileCheck %s
|
|
|
|
// == LLVM IR check begin ==
|
|
// CHECK-LABEL: ; ModuleID = 'LLVMDialectModule'
|
|
// CHECK: define void @test_empty_kernel
|
|
// CHECK: !nvvm.annotations
|
|
// CHECK: !{void (i32, half addrspace(1)*)* @test_empty_kernel, !"maxntidx", i32 128}
|
|
|
|
// Input module for this test. It carries the "triton_gpu.num-warps" attribute
// set to 4 (i32).
// NOTE(review): presumably 4 warps x 32 threads is what yields the maxntidx
// value of 128 expected in the annotations above; confirm against the lowering.
module attributes {"triton_gpu.num-warps" = 4 : i32} {
|
|
|
|
// Kernel with an empty body: takes an `index` argument (%lb) and a pointer to
// f16 (%A), uses neither, and returns immediately.
func @test_empty_kernel(%lb : index, %A : !tt.ptr<f16>) {
|
|
|
|
return
|
|
}
|
|
|
|
}
|