forked from OSchip/llvm-project
Add popcnt feature flag to match gcc. This flag is implied when sse42 is enabled, but can be disabled separately. Move popcnt intrinsics to popcntintrin.h to match gcc.
llvm-svn: 147340
This commit is contained in:
parent
7bd3305f3e
commit
1de8348db7
|
@ -615,6 +615,7 @@ def mno_avx2 : Flag<"-mno-avx2">, Group<m_x86_Features_Group>;
|
|||
def mno_lzcnt : Flag<"-mno-lzcnt">, Group<m_x86_Features_Group>;
|
||||
def mno_bmi : Flag<"-mno-bmi">, Group<m_x86_Features_Group>;
|
||||
def mno_bmi2 : Flag<"-mno-bmi2">, Group<m_x86_Features_Group>;
|
||||
def mno_popcnt : Flag<"-mno-popcnt">, Group<m_x86_Features_Group>;
|
||||
|
||||
def mno_thumb : Flag<"-mno-thumb">, Group<m_Group>;
|
||||
def marm : Flag<"-marm">, Alias<mno_thumb>;
|
||||
|
@ -643,6 +644,7 @@ def mavx2 : Flag<"-mavx2">, Group<m_x86_Features_Group>;
|
|||
def mlzcnt : Flag<"-mlzcnt">, Group<m_x86_Features_Group>;
|
||||
def mbmi : Flag<"-mbmi">, Group<m_x86_Features_Group>;
|
||||
def mbmi2 : Flag<"-mbmi2">, Group<m_x86_Features_Group>;
|
||||
def mpopcnt : Flag<"-mpopcnt">, Group<m_x86_Features_Group>;
|
||||
def mthumb : Flag<"-mthumb">, Group<m_Group>;
|
||||
def mtune_EQ : Joined<"-mtune=">, Group<m_Group>;
|
||||
def multi__module : Flag<"-multi_module">;
|
||||
|
|
|
@ -1198,6 +1198,7 @@ class X86TargetInfo : public TargetInfo {
|
|||
bool HasLZCNT;
|
||||
bool HasBMI;
|
||||
bool HasBMI2;
|
||||
bool HasPOPCNT;
|
||||
|
||||
/// \brief Enumeration of all of the X86 CPUs supported by Clang.
|
||||
///
|
||||
|
@ -1335,7 +1336,7 @@ public:
|
|||
X86TargetInfo(const std::string& triple)
|
||||
: TargetInfo(triple), SSELevel(NoSSE), MMX3DNowLevel(NoMMX3DNow),
|
||||
HasAES(false), HasAVX(false), HasAVX2(false), HasLZCNT(false),
|
||||
HasBMI(false), HasBMI2(false), CPU(CK_Generic) {
|
||||
HasBMI(false), HasBMI2(false), HasPOPCNT(false), CPU(CK_Generic) {
|
||||
BigEndian = false;
|
||||
LongDoubleFormat = &llvm::APFloat::x87DoubleExtended;
|
||||
}
|
||||
|
@ -1519,6 +1520,7 @@ void X86TargetInfo::getDefaultFeatures(llvm::StringMap<bool> &Features) const {
|
|||
Features["lzcnt"] = false;
|
||||
Features["bmi"] = false;
|
||||
Features["bmi2"] = false;
|
||||
Features["popcnt"] = false;
|
||||
|
||||
// FIXME: This *really* should not be here.
|
||||
|
||||
|
@ -1669,7 +1671,8 @@ bool X86TargetInfo::setFeatureEnabled(llvm::StringMap<bool> &Features,
|
|||
Features["ssse3"] = true;
|
||||
else if (Name == "sse4" || Name == "sse4.2")
|
||||
Features["mmx"] = Features["sse"] = Features["sse2"] = Features["sse3"] =
|
||||
Features["ssse3"] = Features["sse41"] = Features["sse42"] = true;
|
||||
Features["ssse3"] = Features["sse41"] = Features["sse42"] =
|
||||
Features["popcnt"] = true;
|
||||
else if (Name == "sse4.1")
|
||||
Features["mmx"] = Features["sse"] = Features["sse2"] = Features["sse3"] =
|
||||
Features["ssse3"] = Features["sse41"] = true;
|
||||
|
@ -1682,11 +1685,11 @@ bool X86TargetInfo::setFeatureEnabled(llvm::StringMap<bool> &Features,
|
|||
else if (Name == "avx")
|
||||
Features["mmx"] = Features["sse"] = Features["sse2"] = Features["sse3"] =
|
||||
Features["ssse3"] = Features["sse41"] = Features["sse42"] =
|
||||
Features["avx"] = true;
|
||||
Features["popcnt"] = Features["avx"] = true;
|
||||
else if (Name == "avx2")
|
||||
Features["mmx"] = Features["sse"] = Features["sse2"] = Features["sse3"] =
|
||||
Features["ssse3"] = Features["sse41"] = Features["sse42"] =
|
||||
Features["avx"] = Features["avx2"] = true;
|
||||
Features["popcnt"] = Features["avx"] = Features["avx2"] = true;
|
||||
else if (Name == "sse4a")
|
||||
Features["mmx"] = Features["sse4a"] = true;
|
||||
else if (Name == "lzcnt")
|
||||
|
@ -1695,6 +1698,8 @@ bool X86TargetInfo::setFeatureEnabled(llvm::StringMap<bool> &Features,
|
|||
Features["bmi"] = true;
|
||||
else if (Name == "bmi2")
|
||||
Features["bmi2"] = true;
|
||||
else if (Name == "popcnt")
|
||||
Features["popcnt"] = true;
|
||||
} else {
|
||||
if (Name == "mmx")
|
||||
Features["mmx"] = Features["3dnow"] = Features["3dnowa"] = false;
|
||||
|
@ -1731,6 +1736,8 @@ bool X86TargetInfo::setFeatureEnabled(llvm::StringMap<bool> &Features,
|
|||
Features["bmi"] = false;
|
||||
else if (Name == "bmi2")
|
||||
Features["bmi2"] = false;
|
||||
else if (Name == "popcnt")
|
||||
Features["popcnt"] = false;
|
||||
}
|
||||
|
||||
return true;
|
||||
|
@ -1765,6 +1772,11 @@ void X86TargetInfo::HandleTargetFeatures(std::vector<std::string> &Features) {
|
|||
continue;
|
||||
}
|
||||
|
||||
if (Features[i].substr(1) == "popcnt") {
|
||||
HasPOPCNT = true;
|
||||
continue;
|
||||
}
|
||||
|
||||
// FIXME: Not sure yet how to treat AVX in regard to SSE levels.
|
||||
// For now let it be enabled together with other SSE levels.
|
||||
if (Features[i].substr(1) == "avx2") {
|
||||
|
@ -1996,6 +2008,9 @@ void X86TargetInfo::getTargetDefines(const LangOptions &Opts,
|
|||
if (HasBMI2)
|
||||
Builder.defineMacro("__BMI2__");
|
||||
|
||||
if (HasPOPCNT)
|
||||
Builder.defineMacro("__POPCNT__");
|
||||
|
||||
// Each case falls through to the previous one here.
|
||||
switch (SSELevel) {
|
||||
case SSE42:
|
||||
|
|
|
@ -0,0 +1,45 @@
|
|||
/*===---- popcntintrin.h - POPCNT intrinsics -------------------------------===
|
||||
*
|
||||
* Permission is hereby granted, free of charge, to any person obtaining a copy
|
||||
* of this software and associated documentation files (the "Software"), to deal
|
||||
* in the Software without restriction, including without limitation the rights
|
||||
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
||||
* copies of the Software, and to permit persons to whom the Software is
|
||||
* furnished to do so, subject to the following conditions:
|
||||
*
|
||||
* The above copyright notice and this permission notice shall be included in
|
||||
* all copies or substantial portions of the Software.
|
||||
*
|
||||
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
||||
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
||||
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
||||
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
||||
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
||||
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
||||
* THE SOFTWARE.
|
||||
*
|
||||
*===-----------------------------------------------------------------------===
|
||||
*/
|
||||
|
||||
#ifndef __POPCNT__
|
||||
#error "POPCNT instruction set not enabled"
|
||||
#endif
|
||||
|
||||
#ifndef _POPCNTINTRIN_H
|
||||
#define _POPCNTINTRIN_H
|
||||
|
||||
static __inline__ int __attribute__((__always_inline__, __nodebug__))
|
||||
_mm_popcnt_u32(unsigned int __A)
|
||||
{
|
||||
return __builtin_popcount(__A);
|
||||
}
|
||||
|
||||
#ifdef __x86_64__
|
||||
static __inline__ long long __attribute__((__always_inline__, __nodebug__))
|
||||
_mm_popcnt_u64(unsigned long long __A)
|
||||
{
|
||||
return __builtin_popcountll(__A);
|
||||
}
|
||||
#endif /* __x86_64__ */
|
||||
|
||||
#endif /* _POPCNTINTRIN_H */
|
|
@ -428,20 +428,9 @@ _mm_crc32_u64(unsigned long long __C, unsigned long long __D)
|
|||
}
|
||||
#endif /* __x86_64__ */
|
||||
|
||||
/* SSE4.2 Population Count. */
|
||||
static __inline__ int __attribute__((__always_inline__, __nodebug__))
|
||||
_mm_popcnt_u32(unsigned int __A)
|
||||
{
|
||||
return __builtin_popcount(__A);
|
||||
}
|
||||
|
||||
#ifdef __x86_64__
|
||||
static __inline__ long long __attribute__((__always_inline__, __nodebug__))
|
||||
_mm_popcnt_u64(unsigned long long __A)
|
||||
{
|
||||
return __builtin_popcountll(__A);
|
||||
}
|
||||
#endif /* __x86_64__ */
|
||||
#ifdef __POPCNT__
|
||||
#include <popcntintrin.h>
|
||||
#endif
|
||||
|
||||
#endif /* __SSE4_2__ */
|
||||
#endif /* __SSE4_1__ */
|
||||
|
|
|
@ -38,6 +38,10 @@
|
|||
#include <lzcntintrin.h>
|
||||
#endif
|
||||
|
||||
// FIXME: SSE4A, 3dNOW, FMA4, XOP, LWP, ABM, POPCNT
|
||||
#ifdef __POPCNT__
|
||||
#include <popcntintrin.h>
|
||||
#endif
|
||||
|
||||
// FIXME: SSE4A, 3dNOW, FMA4, XOP, LWP, ABM
|
||||
|
||||
#endif /* __X86INTRIN_H */
|
||||
|
|
|
@ -0,0 +1,16 @@
|
|||
// RUN: %clang_cc1 %s -O3 -triple=x86_64-apple-darwin -target-feature +popcnt -emit-llvm -o - | FileCheck %s
|
||||
|
||||
// Don't include mm_malloc.h, it's system specific.
|
||||
#define __MM_MALLOC_H
|
||||
|
||||
#include <x86intrin.h>
|
||||
|
||||
unsigned int test_mm_popcnt_u32(unsigned int __X) {
|
||||
// CHECK: @llvm.ctpop.i32
|
||||
return _mm_popcnt_u32(__X);
|
||||
}
|
||||
|
||||
unsigned long long test_mm_popcnt_u64(unsigned long long __X) {
|
||||
// CHECK: @llvm.ctpop.i64
|
||||
return _mm_popcnt_u64(__X);
|
||||
}
|
Loading…
Reference in New Issue