[codegen/tune] bugfix in heuristics for nano-tile sizes
This commit is contained in:
@@ -1,6 +1,10 @@
|
||||
# Optional PyTorch binding: builds the torch_triton shared library from
# conv.cpp, but only when find_package() locates a Torch installation.
find_package(Torch)

# Accept either spelling of the result variable (Torch_FOUND / TORCH_FOUND) so
# the guard does not depend on which one the Torch package config defines.
# Bare variable names are used because if() dereferences them itself; writing
# if(${VAR}) expands the value first and then evaluates it a second time.
if(Torch_FOUND OR TORCH_FOUND)
  # Default CUDA toolkit location. Only applied when CUDA_HOME has not already
  # been provided (e.g. -DCUDA_HOME=/opt/cuda on the command line), so a
  # non-standard install can be used without editing this file.
  if(NOT DEFINED CUDA_HOME)
    set(CUDA_HOME "/usr/local/cuda")
  endif()

  # NOTE(review): these are directory-scoped and therefore also apply to any
  # other target declared in this directory. They are kept as-is because other
  # targets may rely on them; consider the target_* equivalents once confirmed.
  include_directories(${TORCH_INCLUDE_DIRS})
  include_directories("${CUDA_HOME}/include")
  link_directories(${TORCH_LIBRARY_DIRS})

  # Selects the pre-C++11 libstdc++ ABI for everything compiled here.
  # Presumably required to match the ABI of the prebuilt Torch binaries -
  # TODO confirm against the Torch build in use.
  add_definitions(-D_GLIBCXX_USE_CXX11_ABI=0)

  add_library(torch_triton SHARED conv.cpp)
  # Requesting cxx_range_for makes CMake enable at least C++11 for this target.
  target_compile_features(torch_triton PRIVATE cxx_range_for)
  # Keyword-less signature retained on purpose: CMake forbids mixing it with
  # the PRIVATE/PUBLIC signature on the same target, and other files may
  # already link this target using the plain form.
  target_link_libraries(torch_triton "${TORCH_LIBRARIES}")
  target_link_libraries(torch_triton torch triton)
endif()
|
||||
|
Reference in New Issue
Block a user