[codegen/tune] bugfix in heuristics for nano-tile sizes

This commit is contained in:
Philippe Tillet
2019-05-04 01:32:34 -04:00
parent 0d694445e6
commit 30833c18f1
7 changed files with 143 additions and 121 deletions

View File

@@ -1,6 +1,10 @@
# Optional PyTorch extension: the torch_triton shared library is only built
# when find_package(Torch) reports that Torch was located.
find_package(Torch)

# A single guard replaces the two stacked `if(` openers that were closed by one
# endif(). Either spelling of the result variable enables the block:
# find_package() itself reports Torch_FOUND, and a find module may additionally
# (or instead) set the upper-case TORCH_FOUND. The variables are named rather
# than expanded with ${...} so the condition stays well-formed when undefined.
if(Torch_FOUND OR TORCH_FOUND)
  # Default CUDA location; a value supplied by the caller (for example
  # -DCUDA_HOME=/opt/cuda on the command line) takes precedence.
  if(NOT DEFINED CUDA_HOME)
    set(CUDA_HOME "/usr/local/cuda")
  endif()

  # Header search paths: Torch headers plus the CUDA toolkit headers.
  include_directories(${TORCH_INCLUDE_DIRS})
  include_directories("${CUDA_HOME}/include")

  # Must precede add_library(): link_directories() only affects targets
  # created after it is called.
  link_directories(${TORCH_LIBRARY_DIRS})

  # Selects the pre-C++11 libstdc++ ABI.
  # NOTE(review): presumably required to match how the Torch binaries were
  # built -- confirm against the Torch distribution in use.
  add_definitions(-D_GLIBCXX_USE_CXX11_ABI=0)

  add_library(torch_triton SHARED conv.cpp)
  target_compile_features(torch_triton PRIVATE cxx_range_for)

  # Keyword-less signature kept on purpose so the link interface seen by
  # consumers of torch_triton is unchanged.
  target_link_libraries(torch_triton "${TORCH_LIBRARIES}")
  target_link_libraries(torch_triton torch triton)
endif()