2020-11-08 21:33:18 -05:00
|
|
|
include_guard(GLOBAL)
|
|
|
|
|
|
|
|
include(CheckCXXCompilerFlag)
|
|
|
|
include(CheckSymbolExists)
|
|
|
|
include(CMakePushCheckState)
|
|
|
|
|
|
|
|
set(TEST_DIR ${PROJECT_SOURCE_DIR}/cmake/test)
|
|
|
|
|
|
|
|
if(CMAKE_CXX_COMPILER_ID MATCHES "Clang")
|
2019-05-01 05:54:58 -04:00
|
|
|
set(C_CLANG 1)
|
2020-11-08 21:33:18 -05:00
|
|
|
elseif(MAKE_CXX_COMPILER_ID MATCHES "GNU")
|
2019-05-01 05:54:58 -04:00
|
|
|
set(C_GCC 1)
|
2020-11-08 21:33:18 -05:00
|
|
|
elseif(CMAKE_CXX_COMPILER_ID MATCHES "MSVC")
|
2019-05-01 05:54:58 -04:00
|
|
|
set(C_MSVC 1)
|
|
|
|
endif()
|
|
|
|
|
|
|
|
# Detect current compilation architecture and create standard definitions
|
2020-11-08 21:33:18 -05:00
|
|
|
macro(detect_architecture symbol arch)
|
2019-05-01 05:54:58 -04:00
|
|
|
if (NOT DEFINED ARCHITECTURE)
|
|
|
|
check_symbol_exists("${symbol}" "" ARCHITECTURE_${arch})
|
|
|
|
|
|
|
|
if (ARCHITECTURE_${arch})
|
2020-11-08 21:33:18 -05:00
|
|
|
set(ARCHITECTURE ${arch})
|
|
|
|
set(ARCHITECTURE_${arch} TRUE)
|
|
|
|
add_compile_definitions(ARCHITECTURE_${arch})
|
2019-05-01 05:54:58 -04:00
|
|
|
endif()
|
|
|
|
endif()
|
2020-11-08 21:33:18 -05:00
|
|
|
endmacro()
|
|
|
|
|
|
|
|
macro(force_ext_available extension)
|
|
|
|
message(STATUS "Looking for __${extension}__ - forced found")
|
|
|
|
set(HAS_${extension} 1 CACHE INTERNAL "")
|
|
|
|
endmacro()
|
|
|
|
|
|
|
|
function(detect_extensions extension)
|
|
|
|
unset(HAS_${extension})
|
|
|
|
if (ARGC EQUAL 2 AND (${ARGV1})) # force available
|
|
|
|
force_ext_available(${extension})
|
|
|
|
endif()
|
|
|
|
check_symbol_exists("__${extension}__" "" HAS_${extension})
|
|
|
|
if (HAS_${extension})
|
|
|
|
add_compile_definitions(USE_${extension})
|
|
|
|
endif()
|
2019-05-01 05:54:58 -04:00
|
|
|
endfunction()
|
|
|
|
|
2020-11-08 21:33:18 -05:00
|
|
|
function(detect_msvc_native_opt)
|
|
|
|
try_run(RUN_AVX512 COMPILE_AVX512 "${CMAKE_BINARY_DIR}/tmp" "${TEST_DIR}/test_x86_avx512.cxx" COMPILE_DEFINITIONS /arch:AVX512)
|
|
|
|
if (COMPILE_AVX512 AND RUN_AVX512 EQUAL 0)
|
|
|
|
set(ARCH_OPT "AVX512" PARENT_SCOPE)
|
|
|
|
return()
|
|
|
|
endif()
|
|
|
|
try_run(RUN_AVX2 COMPILE_AVX2 "${CMAKE_BINARY_DIR}/tmp" "${TEST_DIR}/test_x86_avx2.cxx" COMPILE_DEFINITIONS /arch:AVX2)
|
|
|
|
if (COMPILE_AVX2 AND RUN_AVX2 EQUAL 0)
|
|
|
|
set(ARCH_OPT "AVX2" PARENT_SCOPE)
|
|
|
|
return()
|
|
|
|
endif()
|
|
|
|
try_run(RUN_AVX COMPILE_AVX "${CMAKE_BINARY_DIR}/tmp" "${TEST_DIR}/test_x86_avx.cxx" COMPILE_DEFINITIONS /arch:AVX)
|
|
|
|
if (COMPILE_AVX AND RUN_AVX EQUAL 0)
|
|
|
|
set(ARCH_OPT "AVX" PARENT_SCOPE)
|
|
|
|
return()
|
|
|
|
endif()
|
|
|
|
|
|
|
|
# Supporting 32-bit x86, what year is it?
|
|
|
|
set(COMPILE_DEF "")
|
|
|
|
set(ARCH_OPT "" PARENT_SCOPE)
|
|
|
|
if (ARCHITECTURE_x86)
|
|
|
|
set(COMPILE_DEF "/arch:SSE2")
|
|
|
|
set(ARCH_OPT "SSE2" PARENT_SCOPE)
|
|
|
|
endif()
|
|
|
|
|
|
|
|
try_run(RUN_SSE42 COMPILE_SSE42 "${CMAKE_BINARY_DIR}/tmp" "${TEST_DIR}/test_x86_sse42.cxx" COMPILE_DEFINITIONS ${COMPILE_DEF})
|
|
|
|
if (COMPILE_SSE42 AND RUN_SSE42 EQUAL 0)
|
|
|
|
force_ext_available(SSE4_2)
|
|
|
|
return()
|
|
|
|
endif()
|
|
|
|
try_run(RUN_SSE41 COMPILE_SSE41 "${CMAKE_BINARY_DIR}/tmp" "${TEST_DIR}/test_x86_sse41.cxx" COMPILE_DEFINITIONS ${COMPILE_DEF})
|
|
|
|
if (COMPILE_SSE41 AND RUN_SSE41 EQUAL 0)
|
|
|
|
force_ext_available(SSE4_1)
|
|
|
|
return()
|
|
|
|
endif()
|
|
|
|
try_run(RUN_SSSE3 COMPILE_SSSE3 "${CMAKE_BINARY_DIR}/tmp" "${TEST_DIR}/test_x86_ssse3.cxx" COMPILE_DEFINITIONS ${COMPILE_DEF})
|
|
|
|
if (COMPILE_SSSE3 AND RUN_SSSE3 EQUAL 0)
|
|
|
|
force_ext_available(SSSE3)
|
|
|
|
return()
|
|
|
|
endif()
|
|
|
|
try_run(RUN_SSE3 COMPILE_SSE3 "${CMAKE_BINARY_DIR}/tmp" "${TEST_DIR}/test_x86_sse3.cxx" COMPILE_DEFINITIONS ${COMPILE_DEF})
|
|
|
|
if (COMPILE_SSE3 AND RUN_SSE3 EQUAL 0)
|
|
|
|
force_ext_available(SSE3)
|
|
|
|
return()
|
|
|
|
endif()
|
|
|
|
try_run(RUN_SSE2 COMPILE_SSE2 "${CMAKE_BINARY_DIR}/tmp" "${TEST_DIR}/test_x86_sse2.cxx" COMPILE_DEFINITIONS ${COMPILE_DEF})
|
|
|
|
if (COMPILE_SSE2 AND RUN_SSE2 EQUAL 0)
|
|
|
|
force_ext_available(SSE2)
|
|
|
|
return()
|
|
|
|
endif()
|
|
|
|
|
|
|
|
if (ARCHITECTURE_x86)
|
|
|
|
# At this point we might as well...
|
|
|
|
set(ARCH_OPT "IA32" PARENT_SCOPE)
|
|
|
|
return()
|
|
|
|
endif()
|
|
|
|
endfunction()
|
|
|
|
|
|
|
|
if (C_MSVC)
|
|
|
|
detect_architecture("_M_AMD64" x86_64)
|
|
|
|
detect_architecture("_M_IX86" x86)
|
|
|
|
detect_architecture("_M_ARM" ARM)
|
|
|
|
detect_architecture("_M_ARM64" ARM64)
|
|
|
|
else()
|
|
|
|
detect_architecture("__x86_64__" x86_64)
|
|
|
|
detect_architecture("__i386__" x86)
|
|
|
|
detect_architecture("__arm__" ARM)
|
|
|
|
detect_architecture("__aarch64__" ARM64)
|
2019-05-01 05:54:58 -04:00
|
|
|
endif()
|
|
|
|
if (NOT DEFINED ARCHITECTURE)
|
2020-11-08 21:33:18 -05:00
|
|
|
message(FATAL_ERROR "Not supported. Please add needed architecture detection.")
|
2019-05-01 05:54:58 -04:00
|
|
|
endif()
|
|
|
|
|
2020-11-08 21:33:18 -05:00
|
|
|
# Note: On x86 MSVC's /arch:SSE2 enables all SSE intrinsics support and is default option.
|
|
|
|
# On x86_64 MSVC's SSE is supported and enabled, so only AVX selection is needed.
|
2019-05-01 05:54:58 -04:00
|
|
|
|
2020-11-08 21:33:18 -05:00
|
|
|
if (FORCE_SSSE3)
|
|
|
|
message(WARNING "FORCE_SSSE3 flag is deprecated, please use ARCH_OPT option.")
|
|
|
|
set(ARCH_OPT "")
|
|
|
|
if (C_MSVC)
|
|
|
|
if (ARCHITECTURE_x86)
|
|
|
|
set(ARCH_OPT "SSE2")
|
|
|
|
endif()
|
|
|
|
force_ext_available(SSSE3)
|
|
|
|
else()
|
|
|
|
set(FORCE_OPT "-mssse3")
|
|
|
|
endif()
|
2019-05-01 05:54:58 -04:00
|
|
|
endif()
|
2020-11-08 21:33:18 -05:00
|
|
|
|
|
|
|
if (FORCE_SSE41)
|
|
|
|
message(WARNING "FORCE_SSE41 flag is deprecated, please use ARCH_OPT option.")
|
|
|
|
set(ARCH_OPT "")
|
|
|
|
if (C_MSVC)
|
|
|
|
if (ARCHITECTURE_x86)
|
|
|
|
set(ARCH_OPT "SSE2")
|
|
|
|
else()
|
|
|
|
force_ext_available(SSE4_1)
|
|
|
|
endif()
|
|
|
|
else()
|
|
|
|
set(FORCE_OPT "-msse4.1")
|
|
|
|
endif()
|
|
|
|
endif()
|
|
|
|
|
|
|
|
if (C_MSVC)
|
|
|
|
# Glue to make ARCH_OPT more flexible for MSVC
|
|
|
|
if (ARCH_OPT STREQUAL "native")
|
|
|
|
detect_msvc_native_opt()
|
|
|
|
elseif(ARCH_OPT STREQUAL "SSE4_2")
|
|
|
|
force_ext_available(SSE4_2)
|
|
|
|
set(ARCH_OPT "")
|
|
|
|
elseif(ARCH_OPT STREQUAL "SSE4_1")
|
|
|
|
force_ext_available(SSE4_1)
|
|
|
|
set(ARCH_OPT "")
|
|
|
|
elseif(ARCH_OPT STREQUAL "SSSE3")
|
|
|
|
force_ext_available(SSSE3)
|
|
|
|
set(ARCH_OPT "")
|
|
|
|
elseif(ARCH_OPT STREQUAL "SSE3")
|
|
|
|
force_ext_available(SSE3)
|
|
|
|
set(ARCH_OPT "")
|
|
|
|
elseif(ARCH_OPT STREQUAL "SSE2")
|
|
|
|
force_ext_available(SSE2)
|
|
|
|
set(ARCH_OPT "")
|
|
|
|
endif()
|
|
|
|
endif()
|
|
|
|
|
|
|
|
message(STATUS "Target architecture: ${ARCHITECTURE}-${ARCH_OPT}")
|
|
|
|
|
|
|
|
cmake_push_check_state(RESET)
|
|
|
|
if (ARCH_OPT)
|
|
|
|
if(C_MSVC)
|
|
|
|
set(CMAKE_REQUIRED_FLAGS "/arch:${ARCH_OPT}")
|
|
|
|
add_compile_options(${CMAKE_REQUIRED_FLAGS})
|
|
|
|
else()
|
|
|
|
set(CMAKE_REQUIRED_FLAGS "-march=${ARCH_OPT}")
|
|
|
|
add_compile_options(-march=${ARCH_OPT})
|
|
|
|
endif()
|
|
|
|
elseif(FORCE_SSSE3 OR FORCE_SSE41)
|
|
|
|
if (NOT C_MSVC)
|
|
|
|
set(CMAKE_REQUIRED_FLAGS ${FORCE_OPT})
|
|
|
|
add_compile_options(${FORCE_OPT})
|
|
|
|
endif()
|
|
|
|
endif()
|
|
|
|
|
|
|
|
check_cxx_compiler_flag("${CMAKE_REQUIRED_FLAGS}" FLAG_SUPPORTED)
|
|
|
|
if (NOT FLAG_SUPPORTED)
|
|
|
|
message(FATAL_ERROR "Flag '${CMAKE_REQUIRED_FLAGS}' rejected by compiler. Please adjust ARCH_OPT option.")
|
|
|
|
endif()
|
|
|
|
|
|
|
|
if (ARCHITECTURE_ARM)
|
|
|
|
if (C_MSVC)
|
|
|
|
force_ext_available(ARM_NEON)
|
|
|
|
else()
|
|
|
|
list(APPEND CMAKE_REQUIRED_FLAGS -mfpu=neon)
|
|
|
|
endif()
|
|
|
|
endif()
|
|
|
|
|
|
|
|
# This is quite basic detection, can be extended if needed
|
|
|
|
detect_extensions(ARM_NEON)
|
|
|
|
detect_extensions(AVX512F)
|
|
|
|
detect_extensions(AVX2 HAS_AVX512F)
|
|
|
|
detect_extensions(AVX HAS_AVX2)
|
|
|
|
detect_extensions(SSE4_2 HAS_AVX)
|
|
|
|
detect_extensions(SSE4_1 HAS_SSE4_2)
|
|
|
|
detect_extensions(SSSE3 HAS_SSE4_1)
|
|
|
|
detect_extensions(SSE3 HAS_SSSE3)
|
|
|
|
detect_extensions(SSE2 HAS_SSE3)
|
|
|
|
|
|
|
|
cmake_pop_check_state()
|
|
|
|
|
|
|
|
set(CMAKE_INTERPROCEDURAL_OPTIMIZATION ON)
|
|
|
|
if (C_CLANG OR C_GCC)
|
|
|
|
add_compile_options(-Wall -Wextra -Wvla -Woverloaded-virtual -ffast-math -ftree-vectorize)
|
|
|
|
elseif (C_MSVC)
|
|
|
|
add_compile_options(/MP)
|
|
|
|
endif()
|
|
|
|
|
|
|
|
if (SANITIZE_ADDRESS)
|
|
|
|
message(STATUS "Activate address sanitization")
|
|
|
|
if(MSVC)
|
|
|
|
set(ASAN_LIB_ARCH ${MSVC_CXX_ARCHITECTURE_ID})
|
|
|
|
string(TOLOWER ${ASAN_LIB_ARCH} ASAN_LIB_ARCH)
|
|
|
|
if(ASAN_LIB_ARCH STREQUAL "x86")
|
|
|
|
set(ASAN_LIB_ARCH "i386")
|
|
|
|
elseif(ASAN_LIB_ARCH STREQUAL "x64")
|
|
|
|
set(ASAN_LIB_ARCH "x86_64")
|
|
|
|
endif()
|
|
|
|
add_compile_options(/fsanitize=address)
|
|
|
|
link_libraries(clang_rt.asan_dynamic-${ASAN_LIB_ARCH} clang_rt.asan_dynamic_runtime_thunk-${ASAN_LIB_ARCH})
|
|
|
|
add_link_options(/wholearchive:clang_rt.asan_dynamic_runtime_thunk-${ASAN_LIB_ARCH}.lib)
|
|
|
|
else()
|
|
|
|
add_compile_options(-fsanitize=address -fno-omit-frame-pointer -g)
|
|
|
|
add_link_options(-fsanitize=address)
|
|
|
|
endif()
|
2019-05-01 05:54:58 -04:00
|
|
|
endif()
|
|
|
|
|
|
|
|
# clear binary test folder
|
|
|
|
FILE(REMOVE_RECURSE ${CMAKE_BINARY_DIR}/tmp)
|