https://github.com/halide/Halide
Tip revision: 8918a0334837b106572e2313f5249ff7395bc401 authored by Steven Johnson on 20 October 2021, 18:03:11 UTC
fixes
fixes
Tip revision: 8918a03
CMakeLists.txt
if (NOT CMAKE_GENERATOR MATCHES "Make|Ninja")
message(STATUS "Notice: ${CMAKE_GENERATOR} does not support depfile dependencies. Incremental builds may fail.")
endif ()
# Keep these lists in alphabetical order.
set(RUNTIME_CPP
aarch64_cpu_features
alignment_128
alignment_32
alignment_64
allocation_cache
android_clock
android_host_cpu_count
android_io
arm_cpu_features
cache
can_use_target
cuda
destructors
device_interface
errors
fake_get_symbol
fake_thread_pool
float16_t
fuchsia_clock
fuchsia_host_cpu_count
fuchsia_yield
gpu_device_selection
halide_buffer_t
hexagon_cache_allocator
hexagon_cpu_features
hexagon_dma
hexagon_dma_pool
hexagon_host
ios_io
linux_clock
linux_host_cpu_count
linux_yield
matlab
metadata
metal
metal_objc_arm
metal_objc_x86
mips_cpu_features
module_aot_ref_count
module_jit_ref_count
msan
msan_stubs
opencl
opengl_egl_context
opengl_glx_context
openglcompute
osx_clock
osx_get_symbol
osx_host_cpu_count
osx_opengl_context
osx_yield
posix_allocator
posix_clock
posix_error_handler
posix_get_symbol
posix_io
posix_print
posix_threads
posix_threads_tsan
powerpc_cpu_features
prefetch
profiler
profiler_inlined
pseudostack
qurt_allocator
qurt_hvx
qurt_hvx_vtcm
qurt_threads
qurt_threads_tsan
qurt_yield
riscv_cpu_features
runtime_api
to_string
trace_helper
tracing
wasm_cpu_features
windows_clock
windows_cuda
windows_d3d12compute_x86
windows_d3d12compute_arm
windows_get_symbol
windows_io
windows_opencl
windows_profiler
windows_threads
windows_threads_tsan
windows_yield
write_debug_image
x86_cpu_features
)
set(RUNTIME_LL
aarch64
arm
arm_no_neon
hvx_128
mips
posix_math
powerpc
ptx_dev
wasm_math
win32_math
x86
x86_avx
x86_avx2
x86_avx512
x86_sse41
)
set(RUNTIME_BC
compute_20
compute_30
compute_35
)
set(RUNTIME_HEADER_FILES
HalideBuffer.h
HalidePyTorchCudaHelpers.h
HalidePyTorchHelpers.h
HalideRuntime.h
HalideRuntimeCuda.h
HalideRuntimeD3D12Compute.h
HalideRuntimeHexagonDma.h
HalideRuntimeHexagonHost.h
HalideRuntimeMetal.h
HalideRuntimeOpenCL.h
HalideRuntimeOpenGLCompute.h
HalideRuntimeQurt.h
)
# Need to create an object library for this because CMake
# doesn't support using target_sources on a target declared
# in a different directory ONLY IF that source was created
# by add_custom_command, as is the case in this directory.
add_library(Halide_initmod OBJECT)
# Note: ensure that these flags match the flags in the Makefile.
# Note: this always uses Clang-from-LLVM for compilation, so none of these flags should need conditionalization.
set(RUNTIME_CXX_FLAGS
-O3
-std=c++17
-ffreestanding
-fno-blocks
-fno-exceptions
-fno-unwind-tables
-fno-vectorize
# Note: we don't want static locals to get thread synchronization stuff.
-fno-threadsafe-statics
# Necessary for using virtual functions in the runtime code.
-fno-rtti
-Wall
-Wcast-qual
-Werror
-Wignored-qualifiers
-Wno-comment
-Wno-psabi
-Wno-unknown-warning-option
-Wno-unused-function
-Wsign-compare
)
foreach (i IN LISTS RUNTIME_CPP)
foreach (j IN ITEMS 32 64)
# -fpic needs special treatment; see below on windows 64bits
set(fpic -fpic)
# for the generic windows 64-bit target, we need -fshort-wchar
set(fshort-wchar "")
# Windows
if (i MATCHES "windows_.*")
# must omit -fpic, otherwise clang will complain with the following:
# clang : error : unsupported option '-fpic' for target 'x86_64-pc-windows-msvc'
set(fpic "")
# Windows x86/x64
if (i MATCHES "windows_.*_x86$")
if (j EQUAL 32)
# win32 uses the stdcall calling convention, which is x86-specific
set(TARGET "i386-unknown-windows-unknown")
else ()
set(TARGET "x86_64-unknown-windows-unknown")
endif ()
# Windows on ARM
elseif (i MATCHES "windows_.*_arm$")
if (j EQUAL 32 AND TARGET_ARM)
set(TARGET "arm-unknown-windows-unknown")
elseif (j EQUAL 64 AND TARGET_AARCH64)
set(TARGET "aarch64-unknown-windows-unknown")
else ()
continue()
endif ()
# Windows Generic
else()
if (j EQUAL 32)
# TODO(marcos): generic code won't hold for ARM32... If ARM32 support becomes necessary,
# all windows-related runtime modules will have to be wrapped in windows_*_arm.cpp files
# for now, generic Windows 32bit code just assumes x86 (i386)
set(TARGET "i386-unknown-windows-unknown")
else ()
# unfortunately, clang doesn't automatically set this flag even though the
# ABI is msvc on windows
set(fshort-wchar -fshort-wchar)
set(TARGET "le64-unknown-windows-unknown")
endif ()
endif()
# Everything else
else()
if (j EQUAL 32)
# (The 'nacl' is a red herring. This is just a generic 32-bit little-endian target.)
set(TARGET "le32-unknown-nacl-unknown")
else ()
# generic 64-bit code
set(TARGET "le64-unknown-unknown-unknown")
endif ()
endif ()
set(SOURCE "${CMAKE_CURRENT_SOURCE_DIR}/${i}.cpp")
set(RUNTIME_DEFINES -DCOMPILING_HALIDE_RUNTIME -DBITS_${j})
set(RUNTIME_DEFINES_debug -g -DDEBUG_RUNTIME ${RUNTIME_DEFINES})
foreach (SUFFIX IN ITEMS "" "_debug")
set(basename "initmod.${i}_${j}${SUFFIX}")
set(LL "${basename}.ll")
set(BC "${basename}.bc")
set(INITMOD "_initmod_${i}_${j}${SUFFIX}.cpp")
set(SYMBOL "halide_internal_initmod_${i}_${j}${SUFFIX}")
set(clang_flags ${RUNTIME_CXX_FLAGS} ${fpic} ${fshort-wchar} ${RUNTIME_DEFINES${SUFFIX}} -m${j} -target ${TARGET} -emit-llvm -S)
set(ll_path "${LL}")
if (CMAKE_GENERATOR MATCHES "Ninja")
if (POLICY CMP0116)
# CMake 3.20+ does the right thing here and transforms the depfiles for us
list(APPEND clang_flags -MD -MF "${basename}.d")
set(dep_args DEPFILE "${basename}.d")
else()
# Dep-files are subtle and require clang to run using *just* the right
# relative paths to the build root, NOT the Halide build root. This is
# a perfect storm of bad behavior from CMake <3.20, Ninja, and Clang.
file(RELATIVE_PATH ll_path "${CMAKE_BINARY_DIR}" "${CMAKE_CURRENT_BINARY_DIR}/${LL}")
file(TO_NATIVE_PATH "${ll_path}" ll_path)
list(APPEND clang_flags -MD -MF "$<SHELL_PATH:${CMAKE_CURRENT_BINARY_DIR}/${basename}.d>")
set(dep_args
WORKING_DIRECTORY "${CMAKE_BINARY_DIR}"
DEPFILE "${CMAKE_CURRENT_BINARY_DIR}/${basename}.d")
endif()
elseif (CMAKE_GENERATOR MATCHES "Make")
set(dep_args IMPLICIT_DEPENDS CXX "${SOURCE}")
endif ()
if (Halide_CLANG_TIDY_BUILD)
# Create a 'fake' entry just so that clang-tidy will see a C++ compilation command
# that it can use for tidy-checking. (This branch should never be taken by 'normal'
# compilations.)
add_library(${basename} STATIC "${SOURCE}")
target_compile_options(${basename} PRIVATE ${RUNTIME_CXX_FLAGS} ${fpic} ${fshort-wchar} -m${j} -target ${TARGET})
target_compile_definitions(${basename} PRIVATE ${RUNTIME_DEFINES})
else()
add_custom_command(OUTPUT "${LL}"
COMMAND clang ${clang_flags} -o "${ll_path}" "$<SHELL_PATH:${SOURCE}>"
DEPENDS "${SOURCE}"
${dep_args}
VERBATIM)
endif()
add_custom_command(OUTPUT "${BC}"
COMMAND llvm-as "${LL}" -o "${BC}"
DEPENDS "${LL}"
VERBATIM)
add_custom_command(OUTPUT "${INITMOD}"
COMMAND binary2cpp ${SYMBOL} < "${BC}" > "${INITMOD}"
DEPENDS "${BC}" binary2cpp
VERBATIM)
target_sources(Halide_initmod PRIVATE ${INITMOD})
endforeach ()
endforeach ()
endforeach ()
foreach (i IN LISTS RUNTIME_LL)
set(LL "${i}.ll")
set(BC "initmod.${i}.bc")
set(INITMOD "_initmod_${i}.cpp")
add_custom_command(OUTPUT "${BC}"
COMMAND llvm-as "$<SHELL_PATH:${CMAKE_CURRENT_SOURCE_DIR}/${LL}>" -o "${BC}"
DEPENDS "${LL}"
VERBATIM)
add_custom_command(OUTPUT "${INITMOD}"
COMMAND binary2cpp "halide_internal_initmod_${i}_ll" < "${BC}" > "${INITMOD}"
DEPENDS "${BC}" binary2cpp
VERBATIM)
target_sources(Halide_initmod PRIVATE ${INITMOD})
endforeach ()
foreach (i IN LISTS RUNTIME_BC)
set(INITMOD "_initmod_ptx_${i}.cpp")
set(RT_BC "${CMAKE_CURRENT_SOURCE_DIR}/nvidia_libdevice_bitcode/libdevice.${i}.10.bc")
add_custom_command(OUTPUT "${INITMOD}"
COMMAND binary2cpp "halide_internal_initmod_ptx_${i}_ll" < "$<SHELL_PATH:${RT_BC}>" > "${INITMOD}"
DEPENDS binary2cpp "${RT_BC}"
VERBATIM)
target_sources(Halide_initmod PRIVATE ${INITMOD})
endforeach ()
add_custom_command(OUTPUT "_initmod_inlined_c.cpp"
COMMAND binary2cpp "halide_internal_initmod_inlined_c" < "$<SHELL_PATH:${CMAKE_CURRENT_SOURCE_DIR}/halide_buffer_t.cpp>" > "_initmod_inlined_c.cpp"
DEPENDS "halide_buffer_t.cpp" binary2cpp
VERBATIM)
target_sources(Halide_initmod PRIVATE "_initmod_inlined_c.cpp")
foreach (i IN LISTS RUNTIME_HEADER_FILES)
string(REPLACE "." "_" SYM_NAME "${i}")
add_custom_command(OUTPUT "_initmod_${SYM_NAME}.cpp"
COMMAND binary2cpp "halide_internal_runtime_header_${SYM_NAME}" < "$<SHELL_PATH:${CMAKE_CURRENT_SOURCE_DIR}/${i}>" > "_initmod_${SYM_NAME}.cpp"
DEPENDS "${i}" binary2cpp
VERBATIM)
target_sources(Halide_initmod PRIVATE "_initmod_${SYM_NAME}.cpp")
configure_file(${i} "${Halide_BINARY_DIR}/include/${i}" COPYONLY)
endforeach ()
##
# Target for the runtime
##
add_library(Halide_Runtime INTERFACE)
add_library(Halide::Runtime ALIAS Halide_Runtime)
target_include_directories(Halide_Runtime INTERFACE $<BUILD_INTERFACE:${Halide_BINARY_DIR}/include>)
set_target_properties(Halide_Runtime PROPERTIES EXPORT_NAME Runtime)