302 lines
8.7 KiB
C++
302 lines
8.7 KiB
C++
// Copyright 2020 Google LLC
|
|
// SPDX-License-Identifier: Apache-2.0
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
#ifndef HIGHWAY_HWY_DETECT_COMPILER_ARCH_H_
|
|
#define HIGHWAY_HWY_DETECT_COMPILER_ARCH_H_
|
|
|
|
// Detects compiler and arch from predefined macros. Zero dependencies for
|
|
// inclusion by foreach_target.h.
|
|
|
|
// Add to #if conditions to prevent IDE from graying out code.
|
|
#if (defined __CDT_PARSER__) || (defined __INTELLISENSE__) || \
|
|
(defined Q_CREATOR_RUN) || (defined __CLANGD__) || \
|
|
(defined GROK_ELLIPSIS_BUILD)
|
|
#define HWY_IDE 1
|
|
#else
|
|
#define HWY_IDE 0
|
|
#endif
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Compiler
|
|
|
|
// Actual MSVC, not clang-cl, which defines _MSC_VER but doesn't behave like
|
|
// MSVC in other aspects (e.g. HWY_DIAGNOSTICS).
|
|
#if defined(_MSC_VER) && !defined(__clang__)
|
|
#define HWY_COMPILER_MSVC _MSC_VER
|
|
#else
|
|
#define HWY_COMPILER_MSVC 0
|
|
#endif
|
|
|
|
#if defined(_MSC_VER) && defined(__clang__)
|
|
#define HWY_COMPILER_CLANGCL _MSC_VER
|
|
#else
|
|
#define HWY_COMPILER_CLANGCL 0
|
|
#endif
|
|
|
|
#ifdef __INTEL_COMPILER
|
|
#define HWY_COMPILER_ICC __INTEL_COMPILER
|
|
#else
|
|
#define HWY_COMPILER_ICC 0
|
|
#endif
|
|
|
|
#ifdef __INTEL_LLVM_COMPILER
|
|
#define HWY_COMPILER_ICX __INTEL_LLVM_COMPILER
|
|
#else
|
|
#define HWY_COMPILER_ICX 0
|
|
#endif
|
|
|
|
// HWY_COMPILER_GCC is a generic macro for all compilers implementing the GNU
|
|
// compiler extensions (eg. Clang, Intel...)
|
|
#ifdef __GNUC__
|
|
#define HWY_COMPILER_GCC (__GNUC__ * 100 + __GNUC_MINOR__)
|
|
#else
|
|
#define HWY_COMPILER_GCC 0
|
|
#endif
|
|
|
|
// Clang or clang-cl, not GCC.
|
|
#ifdef __clang__
|
|
// In case of Apple LLVM (whose version number is unrelated to that of LLVM) or
|
|
// an invalid version number, deduce it from the presence of warnings.
|
|
// Originally based on
|
|
// https://github.com/simd-everywhere/simde/blob/47d6e603de9d04ee05cdfbc57cf282a02be1bf2a/simde/simde-detect-clang.h#L59.
|
|
// Please send updates below to them as well, thanks!
|
|
#if defined(__apple_build_version__) || __clang_major__ >= 999
|
|
#if __has_attribute(unsafe_buffer_usage) // no new warnings in 17.0
|
|
#define HWY_COMPILER_CLANG 1700
|
|
#elif __has_attribute(nouwtable) // no new warnings in 16.0
|
|
#define HWY_COMPILER_CLANG 1600
|
|
#elif __has_warning("-Warray-parameter")
|
|
#define HWY_COMPILER_CLANG 1500
|
|
#elif __has_warning("-Wbitwise-instead-of-logical")
|
|
#define HWY_COMPILER_CLANG 1400
|
|
#elif __has_warning("-Wreserved-identifier")
|
|
#define HWY_COMPILER_CLANG 1300
|
|
#elif __has_warning("-Wformat-insufficient-args")
|
|
#define HWY_COMPILER_CLANG 1200
|
|
#elif __has_warning("-Wimplicit-const-int-float-conversion")
|
|
#define HWY_COMPILER_CLANG 1100
|
|
#elif __has_warning("-Wmisleading-indentation")
|
|
#define HWY_COMPILER_CLANG 1000
|
|
#elif defined(__FILE_NAME__)
|
|
#define HWY_COMPILER_CLANG 900
|
|
#elif __has_warning("-Wextra-semi-stmt") || \
|
|
__has_builtin(__builtin_rotateleft32)
|
|
#define HWY_COMPILER_CLANG 800
|
|
// For reasons unknown, XCode 10.3 (Apple LLVM version 10.0.1) is apparently
|
|
// based on Clang 7, but does not support the warning we test.
|
|
// See https://en.wikipedia.org/wiki/Xcode#Toolchain_versions and
|
|
// https://trac.macports.org/wiki/XcodeVersionInfo.
|
|
#elif __has_warning("-Wc++98-compat-extra-semi") || \
|
|
(defined(__apple_build_version__) && __apple_build_version__ >= 10010000)
|
|
#define HWY_COMPILER_CLANG 700
|
|
#else // Anything older than 7.0 is not recommended for Highway.
|
|
#define HWY_COMPILER_CLANG 600
|
|
#endif // __has_warning chain
|
|
#define HWY_COMPILER3_CLANG (HWY_COMPILER_CLANG * 100)
|
|
#else // use normal version
|
|
#define HWY_COMPILER_CLANG (__clang_major__ * 100 + __clang_minor__)
|
|
#define HWY_COMPILER3_CLANG \
|
|
(__clang_major__ * 10000 + __clang_minor__ * 100 + __clang_patchlevel__)
|
|
#endif
|
|
#else // Not clang
|
|
#define HWY_COMPILER_CLANG 0
|
|
#define HWY_COMPILER3_CLANG 0
|
|
#endif
|
|
|
|
#if HWY_COMPILER_GCC && !HWY_COMPILER_CLANG && !HWY_COMPILER_ICC
|
|
#define HWY_COMPILER_GCC_ACTUAL HWY_COMPILER_GCC
|
|
#else
|
|
#define HWY_COMPILER_GCC_ACTUAL 0
|
|
#endif
|
|
|
|
// More than one may be nonzero, but we want at least one.
|
|
#if 0 == (HWY_COMPILER_MSVC + HWY_COMPILER_CLANGCL + HWY_COMPILER_ICC + \
|
|
HWY_COMPILER_GCC + HWY_COMPILER_CLANG)
|
|
#error "Unsupported compiler"
|
|
#endif
|
|
|
|
// We should only detect one of these (only clang/clangcl overlap)
|
|
#if 1 < \
|
|
(!!HWY_COMPILER_MSVC + !!HWY_COMPILER_ICC + !!HWY_COMPILER_GCC_ACTUAL + \
|
|
!!(HWY_COMPILER_CLANGCL | HWY_COMPILER_CLANG))
|
|
#error "Detected multiple compilers"
|
|
#endif
|
|
|
|
#ifdef __has_builtin
|
|
#define HWY_HAS_BUILTIN(name) __has_builtin(name)
|
|
#else
|
|
#define HWY_HAS_BUILTIN(name) 0
|
|
#endif
|
|
|
|
#ifdef __has_attribute
|
|
#define HWY_HAS_ATTRIBUTE(name) __has_attribute(name)
|
|
#else
|
|
#define HWY_HAS_ATTRIBUTE(name) 0
|
|
#endif
|
|
|
|
#ifdef __has_cpp_attribute
|
|
#define HWY_HAS_CPP_ATTRIBUTE(name) __has_cpp_attribute(name)
|
|
#else
|
|
#define HWY_HAS_CPP_ATTRIBUTE(name) 0
|
|
#endif
|
|
|
|
#ifdef __has_feature
|
|
#define HWY_HAS_FEATURE(name) __has_feature(name)
|
|
#else
|
|
#define HWY_HAS_FEATURE(name) 0
|
|
#endif
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Architecture
|
|
|
|
#if defined(__i386__) || defined(_M_IX86)
|
|
#define HWY_ARCH_X86_32 1
|
|
#else
|
|
#define HWY_ARCH_X86_32 0
|
|
#endif
|
|
|
|
#if defined(__x86_64__) || defined(_M_X64)
|
|
#define HWY_ARCH_X86_64 1
|
|
#else
|
|
#define HWY_ARCH_X86_64 0
|
|
#endif
|
|
|
|
#if HWY_ARCH_X86_32 && HWY_ARCH_X86_64
|
|
#error "Cannot have both x86-32 and x86-64"
|
|
#endif
|
|
|
|
#if HWY_ARCH_X86_32 || HWY_ARCH_X86_64
|
|
#define HWY_ARCH_X86 1
|
|
#else
|
|
#define HWY_ARCH_X86 0
|
|
#endif
|
|
|
|
#if defined(__powerpc64__) || defined(_M_PPC) || defined(__powerpc__)
|
|
#define HWY_ARCH_PPC 1
|
|
#else
|
|
#define HWY_ARCH_PPC 0
|
|
#endif
|
|
|
|
#if defined(__powerpc64__) || (HWY_ARCH_PPC && defined(__64BIT__))
|
|
#define HWY_ARCH_PPC_64 1
|
|
#else
|
|
#define HWY_ARCH_PPC_64 0
|
|
#endif
|
|
|
|
// aarch32 is currently not supported; please raise an issue if you want it.
|
|
#if defined(__ARM_ARCH_ISA_A64) || defined(__aarch64__) || defined(_M_ARM64)
|
|
#define HWY_ARCH_ARM_A64 1
|
|
#else
|
|
#define HWY_ARCH_ARM_A64 0
|
|
#endif
|
|
|
|
#if (defined(__ARM_ARCH) && __ARM_ARCH == 7) || (defined(_M_ARM) && _M_ARM == 7)
|
|
#define HWY_ARCH_ARM_V7 1
|
|
#else
|
|
#define HWY_ARCH_ARM_V7 0
|
|
#endif
|
|
|
|
#if HWY_ARCH_ARM_A64 && HWY_ARCH_ARM_V7
|
|
#error "Cannot have both A64 and V7"
|
|
#endif
|
|
|
|
// Any *supported* version of Arm, i.e. 7 or later
|
|
#if HWY_ARCH_ARM_A64 || HWY_ARCH_ARM_V7
|
|
#define HWY_ARCH_ARM 1
|
|
#else
|
|
#define HWY_ARCH_ARM 0
|
|
#endif
|
|
|
|
// Older than Armv7 (e.g. armel aka Armv5) => we do not support SIMD.
|
|
#if (defined(__arm__) || defined(_M_ARM)) && !HWY_ARCH_ARM
|
|
#define HWY_ARCH_ARM_OLD 1
|
|
#else
|
|
#define HWY_ARCH_ARM_OLD 0
|
|
#endif
|
|
|
|
#if defined(__EMSCRIPTEN__) || defined(__wasm__) || defined(__WASM__)
|
|
#define HWY_ARCH_WASM 1
|
|
#else
|
|
#define HWY_ARCH_WASM 0
|
|
#endif
|
|
|
|
#ifdef __riscv
|
|
#define HWY_ARCH_RVV 1
|
|
#else
|
|
#define HWY_ARCH_RVV 0
|
|
#endif
|
|
|
|
#if defined(__s390x__)
|
|
#define HWY_ARCH_S390X 1
|
|
#else
|
|
#define HWY_ARCH_S390X 0
|
|
#endif
|
|
|
|
// It is an error to detect multiple architectures at the same time, but OK to
|
|
// detect none of the above.
|
|
#if (HWY_ARCH_X86 + HWY_ARCH_PPC + HWY_ARCH_ARM + HWY_ARCH_ARM_OLD + \
|
|
HWY_ARCH_WASM + HWY_ARCH_RVV + HWY_ARCH_S390X) > 1
|
|
#error "Must not detect more than one architecture"
|
|
#endif
|
|
|
|
#if defined(_WIN32) || defined(_WIN64)
|
|
#define HWY_OS_WIN 1
|
|
#else
|
|
#define HWY_OS_WIN 0
|
|
#endif
|
|
|
|
#if defined(linux) || defined(__linux__)
|
|
#define HWY_OS_LINUX 1
|
|
#else
|
|
#define HWY_OS_LINUX 0
|
|
#endif
|
|
|
|
// iOS or Mac
|
|
#if defined(__APPLE__)
|
|
#define HWY_OS_APPLE 1
|
|
#else
|
|
#define HWY_OS_APPLE 0
|
|
#endif
|
|
|
|
//------------------------------------------------------------------------------
|
|
// Endianness
|
|
|
|
#if HWY_COMPILER_MSVC
|
|
#if HWY_ARCH_PPC && defined(_XBOX_VER) && _XBOX_VER >= 200
|
|
// XBox 360 is big-endian
|
|
#define HWY_IS_LITTLE_ENDIAN 0
|
|
#define HWY_IS_BIG_ENDIAN 1
|
|
#else
|
|
// All other targets supported by MSVC are little-endian
|
|
#define HWY_IS_LITTLE_ENDIAN 1
|
|
#define HWY_IS_BIG_ENDIAN 0
|
|
#endif // HWY_ARCH_PPC && defined(_XBOX_VER) && _XBOX_VER >= 200
|
|
#elif defined(__BYTE_ORDER__) && defined(__ORDER_LITTLE_ENDIAN__) && \
|
|
__BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__
|
|
#define HWY_IS_LITTLE_ENDIAN 1
|
|
#define HWY_IS_BIG_ENDIAN 0
|
|
#elif defined(__BYTE_ORDER__) && defined(__ORDER_BIG_ENDIAN__) && \
|
|
__BYTE_ORDER__ == __ORDER_BIG_ENDIAN__
|
|
#define HWY_IS_LITTLE_ENDIAN 0
|
|
#define HWY_IS_BIG_ENDIAN 1
|
|
#else
|
|
#error "Unable to detect endianness or unsupported byte order"
|
|
#endif
|
|
|
|
#if (HWY_IS_LITTLE_ENDIAN + HWY_IS_BIG_ENDIAN) != 1
|
|
#error "Must only detect one byte order"
|
|
#endif
|
|
|
|
#endif // HIGHWAY_HWY_DETECT_COMPILER_ARCH_H_
|