summaryrefslogtreecommitdiffstats
path: root/cmake/modules/FindSSE.cmake
diff options
context:
space:
mode:
Diffstat (limited to 'cmake/modules/FindSSE.cmake')
-rw-r--r--cmake/modules/FindSSE.cmake195
1 files changed, 195 insertions, 0 deletions
diff --git a/cmake/modules/FindSSE.cmake b/cmake/modules/FindSSE.cmake
new file mode 100644
index 0000000..d9d5c7a
--- /dev/null
+++ b/cmake/modules/FindSSE.cmake
@@ -0,0 +1,195 @@
+# Check if SSE instructions are available on the machine where
+# the project is compiled.
+include(TestCXXAcceptsFlag)
+
+if(CMAKE_SYSTEM_NAME MATCHES "Linux")
+ if(CPU MATCHES "x86_64" OR CPU MATCHES "i.86")
+ exec_program(cat ARGS "/proc/cpuinfo" OUTPUT_VARIABLE CPUINFO)
+
+ string(REGEX REPLACE "^.*(sse).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "sse" "${_SSE_THERE}" _SSE_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-msse" _SSE_OK)
+
+ string(REGEX REPLACE "^.*(sse2).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "sse2" "${_SSE_THERE}" _SSE2_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-msse2" _SSE2_OK)
+
+ # SSE3 is also known as the Prescott New Instructions (PNI)
+ # it's labeled as pni in /proc/cpuinfo
+ string(REGEX REPLACE "^.*(pni).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "pni" "${_SSE_THERE}" _SSE3_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-msse3" _SSE3_OK)
+
+ string(REGEX REPLACE "^.*(ssse3).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "ssse3" "${_SSE_THERE}" _SSSE3_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-mssse3" _SSSE3_OK)
+
+ string(REGEX REPLACE "^.*(sse4_1).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "sse4_1" "${_SSE_THERE}" _SSE41_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-msse4.1" _SSE41_OK)
+
+ string(REGEX REPLACE "^.*(sse4_2).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "sse4_2" "${_SSE_THERE}" _SSE42_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-msse4.2" _SSE42_OK)
+
+ string(REGEX REPLACE "^.*(avx).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "avx" "${_SSE_THERE}" _AVX_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-mavx" _AVX_OK)
+
+ string(REGEX REPLACE "^.*(avx2).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "avx2" "${_SSE_THERE}" _AVX2_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-mavx2" _AVX2_OK)
+ endif()
+elseif(CMAKE_SYSTEM_NAME MATCHES "FreeBSD")
+ if(CPU MATCHES "amd64" OR CPU MATCHES "i.86")
+ exec_program(cat ARGS "/var/run/dmesg.boot | grep Features" OUTPUT_VARIABLE CPUINFO)
+
+ string(REGEX REPLACE "^.*(SSE).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "SSE" "${_SSE_THERE}" _SSE_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-msse" _SSE_OK)
+
+ string(REGEX REPLACE "^.*(SSE2).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "SSE2" "${_SSE_THERE}" _SSE2_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-msse2" _SSE2_OK)
+
+ string(REGEX REPLACE "^.*(SSE3).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "SSE3" "${_SSE_THERE}" _SSE3_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-msse3" _SSE3_OK)
+
+ string(REGEX REPLACE "^.*(SSSE3).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "SSSE3" "${_SSE_THERE}" _SSSE3_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-mssse3" _SSSE3_OK)
+
+ string(REGEX REPLACE "^.*(SSE4.1).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "SSE4.1" "${_SSE_THERE}" _SSE41_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-msse4.1" _SSE41_OK)
+ string(REGEX REPLACE "^.*(SSE4.2).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "SSE4.2" "${_SSE_THERE}" _SSE42_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-msse4.2" _SSE42_OK)
+
+ string(REGEX REPLACE "^.*(AVX).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "AVX" "${_SSE_THERE}" _AVX_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-mavx" _AVX_OK)
+
+ string(REGEX REPLACE "^.*(AVX2).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "AVX2" "${_SSE_THERE}" _AVX2_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-mavx2" _AVX2_OK)
+ endif()
+elseif(CMAKE_SYSTEM_NAME MATCHES "Android")
+ if(CPU MATCHES "x86_64" OR CPU MATCHES "i.86")
+ set(_SSE_TRUE TRUE)
+ set(_SSE2_TRUE TRUE)
+ set(_SSE3_TRUE TRUE)
+ set(_SSSE3_TRUE TRUE)
+
+ CHECK_CXX_ACCEPTS_FLAG("-msse" _SSE_OK)
+ CHECK_CXX_ACCEPTS_FLAG("-msse2" _SSE2_OK)
+ CHECK_CXX_ACCEPTS_FLAG("-msse3" _SSE3_OK)
+ CHECK_CXX_ACCEPTS_FLAG("-mssse3" _SSSE3_OK)
+ CHECK_CXX_ACCEPTS_FLAG("-msse4.1" _SSE41_OK)
+ CHECK_CXX_ACCEPTS_FLAG("-msse4.2" _SSE42_OK)
+ CHECK_CXX_ACCEPTS_FLAG("-mavx" _AVX_OK)
+ CHECK_CXX_ACCEPTS_FLAG("-mavx2" _AVX2_OK)
+ endif()
+elseif(CMAKE_SYSTEM_NAME MATCHES "Darwin")
+ if(NOT CPU MATCHES "arm")
+ exec_program("/usr/sbin/sysctl -n machdep.cpu.features machdep.cpu.leaf7_features" OUTPUT_VARIABLE CPUINFO)
+
+ string(REGEX REPLACE "^.*[^S](SSE).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "SSE" "${_SSE_THERE}" _SSE_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-msse" _SSE_OK)
+
+ string(REGEX REPLACE "^.*[^S](SSE2).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "SSE2" "${_SSE_THERE}" _SSE2_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-msse2" _SSE2_OK)
+
+ string(REGEX REPLACE "^.*[^S](SSE3).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "SSE3" "${_SSE_THERE}" _SSE3_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-msse3" _SSE3_OK)
+
+ string(REGEX REPLACE "^.*(SSSE3).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "SSSE3" "${_SSE_THERE}" _SSSE3_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-mssse3" _SSSE3_OK)
+
+ string(REGEX REPLACE "^.*(SSE4.1).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "SSE4.1" "${_SSE_THERE}" _SSE41_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-msse4.1" _SSE41_OK)
+
+ string(REGEX REPLACE "^.*(SSE4.2).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "SSE4.2" "${_SSE_THERE}" _SSE42_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-msse4.2" _SSE42_OK)
+
+ string(REGEX REPLACE "^.*(AVX).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "AVX" "${_SSE_THERE}" _AVX_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-mavx" _AVX_OK)
+
+ string(REGEX REPLACE "^.*(AVX2).*$" "\\1" _SSE_THERE ${CPUINFO})
+ string(COMPARE EQUAL "AVX2" "${_SSE_THERE}" _AVX2_TRUE)
+ CHECK_CXX_ACCEPTS_FLAG("-mavx2" _AVX2_OK)
+ endif()
+elseif(CMAKE_SYSTEM_NAME MATCHES "Windows")
+ # TODO
+ if(ARCH STREQUAL win32 OR ARCH STREQUAL x64)
+ set(_SSE_TRUE true)
+ set(_SSE_OK true)
+ set(_SSE2_TRUE true)
+ set(_SSE2_OK true)
+ endif()
+endif()
+
+include(FindPackageHandleStandardArgs)
+find_package_handle_standard_args(SSE
+ REQUIRED_VARS _SSE_TRUE _SSE_OK
+ FAIL_MESSAGE "Could not find hardware support for SSE")
+set(FPHSA_NAME_MISMATCHED ON)
+find_package_handle_standard_args(SSE2
+ REQUIRED_VARS _SSE2_TRUE _SSE2_OK
+ FAIL_MESSAGE "Could not find hardware support for SSE2")
+find_package_handle_standard_args(SSE3
+ REQUIRED_VARS _SSE3_TRUE _SSE3_OK
+ FAIL_MESSAGE "Could not find hardware support for SSE3")
+find_package_handle_standard_args(SSSE3
+ REQUIRED_VARS _SSSE3_TRUE _SSSE3_OK
+ FAIL_MESSAGE "Could not find hardware support for SSSE3")
+find_package_handle_standard_args(SSE4_1
+ REQUIRED_VARS _SSE41_TRUE _SSE41_OK
+ FAIL_MESSAGE "Could not find hardware support for SSE4.1")
+find_package_handle_standard_args(SSE4_2
+ REQUIRED_VARS _SSE42_TRUE _SSE42_OK
+ FAIL_MESSAGE "Could not find hardware support for SSE4.2")
+find_package_handle_standard_args(AVX
+ REQUIRED_VARS _AVX_TRUE _AVX_OK
+ FAIL_MESSAGE "Could not find hardware support for AVX")
+find_package_handle_standard_args(AVX2
+ REQUIRED_VARS _AVX2_TRUE _AVX2_OK
+ FAIL_MESSAGE "Could not find hardware support for AVX2")
+unset(FPHSA_NAME_MISMATCHED)
+
+mark_as_advanced(SSE2_FOUND SSE3_FOUND SSSE3_FOUND SSE4_1_FOUND SSE4_2_FOUND AVX_FOUND AVX2_FOUND)
+
+unset(_SSE_THERE)
+unset(_SSE_TRUE)
+unset(_SSE_OK)
+unset(_SSE_OK CACHE)
+unset(_SSE2_TRUE)
+unset(_SSE2_OK)
+unset(_SSE2_OK CACHE)
+unset(_SSE3_TRUE)
+unset(_SSE3_OK)
+unset(_SSE3_OK CACHE)
+unset(_SSSE3_TRUE)
+unset(_SSSE3_OK)
+unset(_SSSE3_OK CACHE)
+unset(_SSE4_1_TRUE)
+unset(_SSE41_OK)
+unset(_SSE41_OK CACHE)
+unset(_SSE4_2_TRUE)
+unset(_SSE42_OK)
+unset(_SSE42_OK CACHE)
+unset(_AVX_TRUE)
+unset(_AVX_OK)
+unset(_AVX_OK CACHE)
+unset(_AVX2_TRUE)
+unset(_AVX2_OK)
+unset(_AVX2_OK CACHE)
+