/*===---- cpuid.h - X86 cpu model detection --------------------------------===
 *
 * Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 * See https://llvm.org/LICENSE.txt for license information.
 * SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 *
 *===-----------------------------------------------------------------------===
 */

/* Reject any target that is neither 64-bit nor 32-bit x86. */
#if !__x86_64__ && !__i386__
#error this header is for x86 only
#endif

/* Vendor signatures returned by the identification request (%eax == 0).
 * Each twelve-character vendor string is split across %ebx, %edx and %ecx
 * (in that order), four ASCII characters per register with the first
 * character in the least significant byte. */

/* AMD: "AuthenticAMD" */
#define signature_AMD_ebx     0x68747541 /* "Auth" */
#define signature_AMD_edx     0x69746e65 /* "enti" */
#define signature_AMD_ecx     0x444d4163 /* "cAMD" */

/* CENTAUR: "CentaurHauls" */
#define signature_CENTAUR_ebx 0x746e6543 /* "Cent" */
#define signature_CENTAUR_edx 0x48727561 /* "aurH" */
#define signature_CENTAUR_ecx 0x736c7561 /* "auls" */

/* CYRIX: "CyrixInstead" */
#define signature_CYRIX_ebx   0x69727943 /* "Cyri" */
#define signature_CYRIX_edx   0x736e4978 /* "xIns" */
#define signature_CYRIX_ecx   0x64616574 /* "tead" */

/* INTEL: "GenuineIntel" */
#define signature_INTEL_ebx   0x756e6547 /* "Genu" */
#define signature_INTEL_edx   0x49656e69 /* "ineI" */
#define signature_INTEL_ecx   0x6c65746e /* "ntel" */

/* TM1: "TransmetaCPU" */
#define signature_TM1_ebx     0x6e617254 /* "Tran" */
#define signature_TM1_edx     0x74656d73 /* "smet" */
#define signature_TM1_ecx     0x55504361 /* "aCPU" */

/* TM2: "GenuineTMx86" */
#define signature_TM2_ebx     0x756e6547 /* "Genu" */
#define signature_TM2_edx     0x54656e69 /* "ineT" */
#define signature_TM2_ecx     0x3638784d /* "Mx86" */

/* NSC: "Geode by NSC" */
#define signature_NSC_ebx     0x646f6547 /* "Geod" */
#define signature_NSC_edx     0x79622065 /* "e by" */
#define signature_NSC_ecx     0x43534e20 /* " NSC" */

/* NEXGEN: "NexGenDriven" */
#define signature_NEXGEN_ebx  0x4778654e /* "NexG" */
#define signature_NEXGEN_edx  0x72446e65 /* "enDr" */
#define signature_NEXGEN_ecx  0x6e657669 /* "iven" */

/* RISE: "RiseRiseRise" */
#define signature_RISE_ebx    0x65736952 /* "Rise" */
#define signature_RISE_edx    0x65736952 /* "Rise" */
#define signature_RISE_ecx    0x65736952 /* "Rise" */

/* SIS: "SiS SiS SiS " */
#define signature_SIS_ebx     0x20536953 /* "SiS " */
#define signature_SIS_edx     0x20536953 /* "SiS " */
#define signature_SIS_ecx     0x20536953 /* "SiS " */

/* UMC: "UMC UMC UMC " */
#define signature_UMC_ebx     0x20434d55 /* "UMC " */
#define signature_UMC_edx     0x20434d55 /* "UMC " */
#define signature_UMC_ecx     0x20434d55 /* "UMC " */

/* VIA: "VIA VIA VIA " */
#define signature_VIA_ebx     0x20414956 /* "VIA " */
#define signature_VIA_edx     0x20414956 /* "VIA " */
#define signature_VIA_ecx     0x20414956 /* "VIA " */

/* VORTEX: "Vortex86 SoC" */
#define signature_VORTEX_ebx  0x74726f56 /* "Vort" */
#define signature_VORTEX_edx  0x36387865 /* "ex86" */
#define signature_VORTEX_ecx  0x436f5320 /* " SoC" */

/* Features in %ecx for leaf 1.
 * Each macro is a single-bit mask; the trailing comment gives the bit index. */
#define bit_SSE3        0x00000001 /* bit 0 */
#define bit_PCLMULQDQ   0x00000002 /* bit 1 */
#define bit_PCLMUL      bit_PCLMULQDQ /* for gcc compat */
#define bit_DTES64      0x00000004 /* bit 2 */
#define bit_MONITOR     0x00000008 /* bit 3 */
#define bit_DSCPL       0x00000010 /* bit 4 */
#define bit_VMX         0x00000020 /* bit 5 */
#define bit_SMX         0x00000040 /* bit 6 */
#define bit_EIST        0x00000080 /* bit 7 */
#define bit_TM2         0x00000100 /* bit 8 */
#define bit_SSSE3       0x00000200 /* bit 9 */
#define bit_CNXTID      0x00000400 /* bit 10 */
#define bit_FMA         0x00001000 /* bit 12 */
#define bit_CMPXCHG16B  0x00002000 /* bit 13 */
#define bit_xTPR        0x00004000 /* bit 14 */
#define bit_PDCM        0x00008000 /* bit 15 */
#define bit_PCID        0x00020000 /* bit 17 */
#define bit_DCA         0x00040000 /* bit 18 */
#define bit_SSE41       0x00080000 /* bit 19 */
#define bit_SSE4_1      bit_SSE41 /* for gcc compat */
#define bit_SSE42       0x00100000 /* bit 20 */
#define bit_SSE4_2      bit_SSE42 /* for gcc compat */
#define bit_x2APIC      0x00200000 /* bit 21 */
#define bit_MOVBE       0x00400000 /* bit 22 */
#define bit_POPCNT      0x00800000 /* bit 23 */
#define bit_TSCDeadline 0x01000000 /* bit 24 */
#define bit_AESNI       0x02000000 /* bit 25 */
#define bit_AES         bit_AESNI /* for gcc compat */
#define bit_XSAVE       0x04000000 /* bit 26 */
#define bit_OSXSAVE     0x08000000 /* bit 27 */
#define bit_AVX         0x10000000 /* bit 28 */
#define bit_F16C        0x20000000 /* bit 29 */
#define bit_RDRND       0x40000000 /* bit 30 */

/* Features in %edx for leaf 1.
 * Each macro is a single-bit mask; the trailing comment gives the bit index. */
#define bit_FPU         0x00000001 /* bit 0 */
#define bit_VME         0x00000002 /* bit 1 */
#define bit_DE          0x00000004 /* bit 2 */
#define bit_PSE         0x00000008 /* bit 3 */
#define bit_TSC         0x00000010 /* bit 4 */
#define bit_MSR         0x00000020 /* bit 5 */
#define bit_PAE         0x00000040 /* bit 6 */
#define bit_MCE         0x00000080 /* bit 7 */
#define bit_CX8         0x00000100 /* bit 8 */
#define bit_CMPXCHG8B   bit_CX8 /* for gcc compat */
#define bit_APIC        0x00000200 /* bit 9 */
#define bit_SEP         0x00000800 /* bit 11 */
#define bit_MTRR        0x00001000 /* bit 12 */
#define bit_PGE         0x00002000 /* bit 13 */
#define bit_MCA         0x00004000 /* bit 14 */
#define bit_CMOV        0x00008000 /* bit 15 */
#define bit_PAT         0x00010000 /* bit 16 */
#define bit_PSE36       0x00020000 /* bit 17 */
#define bit_PSN         0x00040000 /* bit 18 */
#define bit_CLFSH       0x00080000 /* bit 19 */
#define bit_DS          0x00200000 /* bit 21 */
#define bit_ACPI        0x00400000 /* bit 22 */
#define bit_MMX         0x00800000 /* bit 23 */
#define bit_FXSR        0x01000000 /* bit 24 */
#define bit_FXSAVE      bit_FXSR /* for gcc compat */
#define bit_SSE         0x02000000 /* bit 25 */
#define bit_SSE2        0x04000000 /* bit 26 */
#define bit_SS          0x08000000 /* bit 27 */
#define bit_HTT         0x10000000 /* bit 28 */
#define bit_TM          0x20000000 /* bit 29 */
#define bit_PBE         0x80000000 /* bit 31 */

/* Features in %ebx for leaf 7 sub-leaf 0.
 * Each macro is a single-bit mask; the trailing comment gives the bit index. */
#define bit_FSGSBASE    0x00000001 /* bit 0 */
#define bit_SGX         0x00000004 /* bit 2 */
#define bit_BMI         0x00000008 /* bit 3 */
#define bit_HLE         0x00000010 /* bit 4 */
#define bit_AVX2        0x00000020 /* bit 5 */
#define bit_SMEP        0x00000080 /* bit 7 */
#define bit_BMI2        0x00000100 /* bit 8 */
#define bit_ENH_MOVSB   0x00000200 /* bit 9 */
#define bit_INVPCID     0x00000400 /* bit 10 */
#define bit_RTM         0x00000800 /* bit 11 */
#define bit_MPX         0x00004000 /* bit 14 */
#define bit_AVX512F     0x00010000 /* bit 16 */
#define bit_AVX512DQ    0x00020000 /* bit 17 */
#define bit_RDSEED      0x00040000 /* bit 18 */
#define bit_ADX         0x00080000 /* bit 19 */
#define bit_AVX512IFMA  0x00200000 /* bit 21 */
#define bit_CLFLUSHOPT  0x00800000 /* bit 23 */
#define bit_CLWB        0x01000000 /* bit 24 */
#define bit_AVX512PF    0x04000000 /* bit 26 */
#define bit_AVX512ER    0x08000000 /* bit 27 */
#define bit_AVX512CD    0x10000000 /* bit 28 */
#define bit_SHA         0x20000000 /* bit 29 */
#define bit_AVX512BW    0x40000000 /* bit 30 */
#define bit_AVX512VL    0x80000000 /* bit 31 */

/* Features in %ecx for leaf 7 sub-leaf 0.
 * Each macro is a single-bit mask; the trailing comment gives the bit index. */
#define bit_PREFTCHWT1      0x00000001 /* bit 0 */
#define bit_AVX512VBMI      0x00000002 /* bit 1 */
/* PKU is reported in bit 3; bit 2 (0x00000004) is a different feature flag
 * (UMIP), so testing it would misreport protection-key support. */
#define bit_PKU             0x00000008 /* bit 3 */
#define bit_OSPKE           0x00000010 /* bit 4 */
#define bit_WAITPKG         0x00000020 /* bit 5 */
#define bit_AVX512VBMI2     0x00000040 /* bit 6 */
#define bit_SHSTK           0x00000080 /* bit 7 */
#define bit_GFNI            0x00000100 /* bit 8 */
#define bit_VAES            0x00000200 /* bit 9 */
#define bit_VPCLMULQDQ      0x00000400 /* bit 10 */
#define bit_AVX512VNNI      0x00000800 /* bit 11 */
#define bit_AVX512BITALG    0x00001000 /* bit 12 */
#define bit_AVX512VPOPCNTDQ 0x00004000 /* bit 14 */
#define bit_RDPID           0x00400000 /* bit 22 */
#define bit_CLDEMOTE        0x02000000 /* bit 25 */
#define bit_MOVDIRI         0x08000000 /* bit 27 */
#define bit_MOVDIR64B       0x10000000 /* bit 28 */
#define bit_ENQCMD          0x20000000 /* bit 29 */

/* Features in %edx for leaf 7 sub-leaf 0.
 * Each macro is a single-bit mask; the trailing comment gives the bit index. */
#define bit_AVX5124VNNIW  0x00000004 /* bit 2 */
#define bit_AVX5124FMAPS  0x00000008 /* bit 3 */
#define bit_PCONFIG       0x00040000 /* bit 18 */
#define bit_IBT           0x00100000 /* bit 20 */

/* AVX512_BF16 provides BFLOAT16 support (introduced for Cooper Lake): the
 * VCVTNE2PS2BF16 and VCVTNEPS2BF16 conversion instructions from IEEE single
 * precision, and the DPBF16PS Vector Neural Network Instruction taking
 * BFLOAT16 inputs. For details see the Intel Architecture Instruction Set
 * Extensions Programming Reference:
 * https://software.intel.com/en-us/download/intel-architecture-instruction-set-extensions-programming-reference
 * (Added by https://reviews.llvm.org/D60552, llvm-svn 360018.)
 */
/* Features in %eax for leaf 7 sub-leaf 1.
 * Single-bit mask; the trailing comment gives the bit index. */
#define bit_AVX512BF16    0x00000020 /* bit 5 */

/* Features in %eax for leaf 13 sub-leaf 1.
 * Each macro is a single-bit mask; the trailing comment gives the bit index. */
#define bit_XSAVEOPT    0x00000001 /* bit 0 */
#define bit_XSAVEC      0x00000002 /* bit 1 */
#define bit_XSAVES      0x00000008 /* bit 3 */

/* Features in %ebx for leaf 0x14 sub-leaf 0.
 * PTWRITE is enumerated in %ebx; for this leaf %eax holds the maximum
 * sub-leaf number rather than feature flags. */
#define bit_PTWRITE     0x00000010 /* bit 4 */

/* Features in %ecx for leaf 0x80000001.
 * Each macro is a single-bit mask; the trailing comment gives the bit index. */
#define bit_LAHF_LM     0x00000001 /* bit 0 */
#define bit_ABM         0x00000020 /* bit 5 */
#define bit_LZCNT       bit_ABM /* for gcc compat */
#define bit_SSE4a       0x00000040 /* bit 6 */
#define bit_PRFCHW      0x00000100 /* bit 8 */
#define bit_XOP         0x00000800 /* bit 11 */
#define bit_LWP         0x00008000 /* bit 15 */
#define bit_FMA4        0x00010000 /* bit 16 */
#define bit_TBM         0x00200000 /* bit 21 */
#define bit_MWAITX      0x20000000 /* bit 29 */

/* Features in %edx for leaf 0x80000001.
 * Each macro is a single-bit mask; the trailing comment gives the bit index. */
#define bit_MMXEXT      0x00400000 /* bit 22 */
#define bit_LM          0x20000000 /* bit 29 */
#define bit_3DNOWP      0x40000000 /* bit 30 */
#define bit_3DNOW       0x80000000 /* bit 31 */

/* Features in %ebx for leaf 0x80000008.
 * Each macro is a single-bit mask; the trailing comment gives the bit index. */
#define bit_CLZERO      0x00000001 /* bit 0 */
#define bit_WBNOINVD    0x00000200 /* bit 9 */

/* __cpuid(leaf, eax, ebx, ecx, edx)
 *   Executes the cpuid instruction with %eax loaded from __leaf and stores
 *   the resulting %eax, %ebx, %ecx and %edx into the four lvalue arguments.
 *
 * __cpuid_count(leaf, count, eax, ebx, ecx, edx)
 *   Same as __cpuid, but additionally loads %ecx from __count before the
 *   instruction executes (sub-leaf selection).
 */
#if !__i386__
/* x86-64 uses %rbx as the base register, so preserve it: %rbx is exchanged
 * with the register bound to __ebx before and after cpuid, which leaves %rbx
 * holding its original value and the cpuid %ebx result in __ebx. */
#define __cpuid(__leaf, __eax, __ebx, __ecx, __edx) \
    __asm(" xchgq %%rbx,%q1\n" \
          " cpuid\n" \
          " xchgq %%rbx,%q1" \
          : "=a"(__eax), "=r" (__ebx), "=c"(__ecx), "=d"(__edx) \
          : "0"(__leaf))

#define __cpuid_count(__leaf, __count, __eax, __ebx, __ecx, __edx) \
    __asm(" xchgq %%rbx,%q1\n" \
          " cpuid\n" \
          " xchgq %%rbx,%q1" \
          : "=a"(__eax), "=r" (__ebx), "=c"(__ecx), "=d"(__edx) \
          : "0"(__leaf), "2"(__count))
#else
/* 32-bit x86: the result registers are bound directly to the outputs. */
#define __cpuid(__leaf, __eax, __ebx, __ecx, __edx) \
    __asm("cpuid" : "=a"(__eax), "=b" (__ebx), "=c"(__ecx), "=d"(__edx) \
                  : "0"(__leaf))

#define __cpuid_count(__leaf, __count, __eax, __ebx, __ecx, __edx) \
    __asm("cpuid" : "=a"(__eax), "=b" (__ebx), "=c"(__ecx), "=d"(__edx) \
                  : "0"(__leaf), "2"(__count))
#endif

/* Executes cpuid for __leaf and returns the value it leaves in %eax; the
 * other functions in this header call it with 0 or 0x80000000 and treat the
 * result as the highest supported leaf of that range.
 *
 * __leaf: leaf number passed to cpuid.
 * __sig:  if non-null, receives the %ebx value produced by the same cpuid
 *         invocation.
 *
 * On 32-bit x86 the function first checks that the cpuid instruction exists
 * by trying to flip the ID flag (bit 21, mask 0x00200000) in EFLAGS; if the
 * flag cannot be changed it returns 0 without executing cpuid.
 */
static __inline int __get_cpuid_max (unsigned int __leaf, unsigned int *__sig)
{
    unsigned int __a, __b, __c, __d;
#if __i386__
    int __have_cpuid;

    /* Read EFLAGS, toggle bit 0x00200000, write it back and read it again;
     * the output is 1 only when the re-read value differs from the first. */
    __asm("  pushfl\n"
          "  popl   %%eax\n"
          "  movl   %%eax,%%ecx\n"
          "  xorl   $0x00200000,%%eax\n"
          "  pushl  %%eax\n"
          "  popfl\n"
          "  pushfl\n"
          "  popl   %%eax\n"
          "  movl   $0,%0\n"
          "  cmpl   %%eax,%%ecx\n"
          "  je     1f\n"
          "  movl   $1,%0\n"
          "1:"
        : "=r" (__have_cpuid) : : "eax", "ecx");
    if (__have_cpuid == 0)
        return 0;
#endif

    __cpuid(__leaf, __a, __b, __c, __d);
    if (__sig != 0)
        *__sig = __b;
    return __a;
}

/* Queries cpuid leaf __leaf and stores the four result registers through
 * __eax, __ebx, __ecx and __edx.
 *
 * The highest supported leaf of the matching range (basic, or extended when
 * bit 31 of __leaf is set) is looked up first via __get_cpuid_max().
 *
 * Returns 1 on success. Returns 0, leaving the outputs untouched, when the
 * reported maximum is 0 or is lower than __leaf.
 */
static __inline int __get_cpuid (unsigned int __leaf, unsigned int *__eax,
                                 unsigned int *__ebx, unsigned int *__ecx,
                                 unsigned int *__edx)
{
    unsigned int __range = __leaf & 0x80000000;
    unsigned int __limit = __get_cpuid_max(__range, 0);

    if (__limit != 0 && __leaf <= __limit) {
        __cpuid(__leaf, *__eax, *__ebx, *__ecx, *__edx);
        return 1;
    }

    return 0;
}

/* Queries cpuid leaf __leaf, sub-leaf __subleaf, and stores the four result
 * registers through __eax, __ebx, __ecx and __edx.
 *
 * Only the leaf number is validated, against the maximum reported by
 * __get_cpuid_max() for the matching range (basic, or extended when bit 31
 * of __leaf is set); __subleaf is passed to cpuid unchecked.
 *
 * Returns 1 on success. Returns 0, leaving the outputs untouched, when the
 * reported maximum is 0 or is lower than __leaf.
 */
static __inline int __get_cpuid_count (unsigned int __leaf,
                                       unsigned int __subleaf,
                                       unsigned int *__eax, unsigned int *__ebx,
                                       unsigned int *__ecx, unsigned int *__edx)
{
    unsigned int __range = __leaf & 0x80000000;
    unsigned int __limit = __get_cpuid_max(__range, 0);

    if (__limit != 0 && __leaf <= __limit) {
        __cpuid_count(__leaf, __subleaf, *__eax, *__ebx, *__ecx, *__edx);
        return 1;
    }

    return 0;
}