diff options
author | Craig Topper <craig.topper@gmail.com> | 2011-12-29 16:10:46 +0000 |
---|---|---|
committer | Craig Topper <craig.topper@gmail.com> | 2011-12-29 16:10:46 +0000 |
commit | e14e08b2552b43d81a295401ddf9b8da2c499233 (patch) | |
tree | a6098ab9acaa1e14ae5a8d5b6d088bfa7c922c05 /lib | |
parent | 63d32bdf895e1ad8cfeef8e634a84fe136215202 (diff) |
Add popcnt feature flag to match gcc. This flag is implied when sse42 is enabled, but can be disabled separately. Move popcnt intrinsics to popcntintrin.h to match gcc.
git-svn-id: https://llvm.org/svn/llvm-project/cfe/trunk@147340 91177308-0d34-0410-b5e6-96231b3b80d8
Diffstat (limited to 'lib')
-rw-r--r-- | lib/Basic/Targets.cpp | 23 | ||||
-rw-r--r-- | lib/Headers/popcntintrin.h | 45 | ||||
-rw-r--r-- | lib/Headers/smmintrin.h | 17 | ||||
-rw-r--r-- | lib/Headers/x86intrin.h | 6 |
4 files changed, 72 insertions, 19 deletions
diff --git a/lib/Basic/Targets.cpp b/lib/Basic/Targets.cpp index bb1051d740..a768226b40 100644 --- a/lib/Basic/Targets.cpp +++ b/lib/Basic/Targets.cpp @@ -1198,6 +1198,7 @@ class X86TargetInfo : public TargetInfo { bool HasLZCNT; bool HasBMI; bool HasBMI2; + bool HasPOPCNT; /// \brief Enumeration of all of the X86 CPUs supported by Clang. /// @@ -1335,7 +1336,7 @@ public: X86TargetInfo(const std::string& triple) : TargetInfo(triple), SSELevel(NoSSE), MMX3DNowLevel(NoMMX3DNow), HasAES(false), HasAVX(false), HasAVX2(false), HasLZCNT(false), - HasBMI(false), HasBMI2(false), CPU(CK_Generic) { + HasBMI(false), HasBMI2(false), HasPOPCNT(false), CPU(CK_Generic) { BigEndian = false; LongDoubleFormat = &llvm::APFloat::x87DoubleExtended; } @@ -1519,6 +1520,7 @@ void X86TargetInfo::getDefaultFeatures(llvm::StringMap<bool> &Features) const { Features["lzcnt"] = false; Features["bmi"] = false; Features["bmi2"] = false; + Features["popcnt"] = false; // FIXME: This *really* should not be here. @@ -1669,7 +1671,8 @@ bool X86TargetInfo::setFeatureEnabled(llvm::StringMap<bool> &Features, Features["ssse3"] = true; else if (Name == "sse4" || Name == "sse4.2") Features["mmx"] = Features["sse"] = Features["sse2"] = Features["sse3"] = - Features["ssse3"] = Features["sse41"] = Features["sse42"] = true; + Features["ssse3"] = Features["sse41"] = Features["sse42"] = + Features["popcnt"] = true; else if (Name == "sse4.1") Features["mmx"] = Features["sse"] = Features["sse2"] = Features["sse3"] = Features["ssse3"] = Features["sse41"] = true; @@ -1682,11 +1685,11 @@ bool X86TargetInfo::setFeatureEnabled(llvm::StringMap<bool> &Features, else if (Name == "avx") Features["mmx"] = Features["sse"] = Features["sse2"] = Features["sse3"] = Features["ssse3"] = Features["sse41"] = Features["sse42"] = - Features["avx"] = true; + Features["popcnt"] = Features["avx"] = true; else if (Name == "avx2") Features["mmx"] = Features["sse"] = Features["sse2"] = Features["sse3"] = Features["ssse3"] = Features["sse41"] = Features["sse42"] = - Features["avx"] = Features["avx2"] = true; + Features["popcnt"] = Features["avx"] = Features["avx2"] = true; else if (Name == "sse4a") Features["mmx"] = Features["sse4a"] = true; else if (Name == "lzcnt") @@ -1695,6 +1698,8 @@ bool X86TargetInfo::setFeatureEnabled(llvm::StringMap<bool> &Features, Features["bmi"] = true; else if (Name == "bmi2") Features["bmi2"] = true; + else if (Name == "popcnt") + Features["popcnt"] = true; } else { if (Name == "mmx") Features["mmx"] = Features["3dnow"] = Features["3dnowa"] = false; @@ -1731,6 +1736,8 @@ bool X86TargetInfo::setFeatureEnabled(llvm::StringMap<bool> &Features, Features["bmi"] = false; else if (Name == "bmi2") Features["bmi2"] = false; + else if (Name == "popcnt") + Features["popcnt"] = false; } return true; @@ -1765,6 +1772,11 @@ void X86TargetInfo::HandleTargetFeatures(std::vector<std::string> &Features) { continue; } + if (Features[i].substr(1) == "popcnt") { + HasPOPCNT = true; + continue; + } + // FIXME: Not sure yet how to treat AVX in regard to SSE levels. // For now let it be enabled together with other SSE levels. if (Features[i].substr(1) == "avx2") { @@ -1996,6 +2008,9 @@ void X86TargetInfo::getTargetDefines(const LangOptions &Opts, if (HasBMI2) Builder.defineMacro("__BMI2__"); + if (HasPOPCNT) + Builder.defineMacro("__POPCNT__"); + // Each case falls through to the previous one here. switch (SSELevel) { case SSE42: diff --git a/lib/Headers/popcntintrin.h b/lib/Headers/popcntintrin.h new file mode 100644 index 0000000000..d439daa8d6 --- /dev/null +++ b/lib/Headers/popcntintrin.h @@ -0,0 +1,45 @@ +/*===---- popcntintrin.h - POPCNT intrinsics -------------------------------=== + * + * Permission is hereby granted, free of charge, to any person obtaining a copy + * of this software and associated documentation files (the "Software"), to deal + * in the Software without restriction, including without limitation the rights + * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the Software is + * furnished to do so, subject to the following conditions: + * + * The above copyright notice and this permission notice shall be included in + * all copies or substantial portions of the Software. + * + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE + * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN + * THE SOFTWARE. + * + *===-----------------------------------------------------------------------=== + */ + +#ifndef __POPCNT__ +#error "POPCNT instruction set not enabled" +#endif + +#ifndef _POPCNTINTRIN_H +#define _POPCNTINTRIN_H + +static __inline__ int __attribute__((__always_inline__, __nodebug__)) +_mm_popcnt_u32(unsigned int __A) +{ + return __builtin_popcount(__A); +} + +#ifdef __x86_64__ +static __inline__ long long __attribute__((__always_inline__, __nodebug__)) +_mm_popcnt_u64(unsigned long long __A) +{ + return __builtin_popcountll(__A); +} +#endif /* __x86_64__ */ + +#endif /* _POPCNTINTRIN_H */ diff --git a/lib/Headers/smmintrin.h b/lib/Headers/smmintrin.h index 2e376ddb46..1ca70f8d36 100644 --- a/lib/Headers/smmintrin.h +++ b/lib/Headers/smmintrin.h @@ -428,20 +428,9 @@ _mm_crc32_u64(unsigned long long __C, unsigned long long __D) } #endif /* __x86_64__ */ -/* SSE4.2 Population Count. */ -static __inline__ int __attribute__((__always_inline__, __nodebug__)) -_mm_popcnt_u32(unsigned int __A) -{ - return __builtin_popcount(__A); -} - -#ifdef __x86_64__ -static __inline__ long long __attribute__((__always_inline__, __nodebug__)) -_mm_popcnt_u64(unsigned long long __A) -{ - return __builtin_popcountll(__A); -} -#endif /* __x86_64__ */ +#ifdef __POPCNT__ +#include <popcntintrin.h> +#endif #endif /* __SSE4_2__ */ #endif /* __SSE4_1__ */ diff --git a/lib/Headers/x86intrin.h b/lib/Headers/x86intrin.h index e64ee37413..181330d0bb 100644 --- a/lib/Headers/x86intrin.h +++ b/lib/Headers/x86intrin.h @@ -38,6 +38,10 @@ #include <lzcntintrin.h> #endif -// FIXME: SSE4A, 3dNOW, FMA4, XOP, LWP, ABM, POPCNT +#ifdef __POPCNT__ +#include <popcntintrin.h> +#endif + +// FIXME: SSE4A, 3dNOW, FMA4, XOP, LWP, ABM #endif /* __X86INTRIN_H */ |