/*===---- immintrin.h - Intel intrinsics -----------------------------------===
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 *
 *===-----------------------------------------------------------------------===
 */
|
|
|
|
|
|
|
|
#ifndef __IMMINTRIN_H
|
|
|
|
#define __IMMINTRIN_H
|
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__MMX__)
|
2010-08-21 02:04:07 +08:00
|
|
|
#include <mmintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2010-08-21 02:04:07 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__SSE__)
|
2010-08-21 02:04:07 +08:00
|
|
|
#include <xmmintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2010-08-21 02:04:07 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__SSE2__)
|
2010-08-21 02:04:07 +08:00
|
|
|
#include <emmintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2010-08-21 02:04:07 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__SSE3__)
|
2010-08-21 02:04:07 +08:00
|
|
|
#include <pmmintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2010-08-21 02:04:07 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__SSSE3__)
|
2010-08-21 02:04:07 +08:00
|
|
|
#include <tmmintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2010-08-21 02:04:07 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || \
|
|
|
|
(defined(__SSE4_2__) || defined(__SSE4_1__))
|
2010-08-21 02:04:07 +08:00
|
|
|
#include <smmintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2010-08-21 02:04:07 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || \
|
|
|
|
(defined(__AES__) || defined(__PCLMUL__))
|
2010-08-21 02:04:07 +08:00
|
|
|
#include <wmmintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2010-08-21 02:04:07 +08:00
|
|
|
|
2016-07-05 23:56:03 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__CLFLUSHOPT__)
|
|
|
|
#include <clflushoptintrin.h>
|
|
|
|
#endif
|
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX__)
|
2010-08-21 02:04:07 +08:00
|
|
|
#include <avxintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2010-08-21 02:04:07 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX2__)
|
2011-12-19 13:04:33 +08:00
|
|
|
#include <avx2intrin.h>
|
|
|
|
|
2015-12-03 02:41:52 +08:00
|
|
|
/* The 256-bit versions of functions in f16cintrin.h.
   Intel documents these as being in immintrin.h, and
   they depend on typedefs from avxintrin.h. */

/* _mm256_cvtps_ph(a, imm)
 *
 * Casts `a` to __m256, reinterprets it as __v8sf, and hands it together with
 * `imm` to __builtin_ia32_vcvtps2ph256; the builtin's result is cast to
 * __m128i.
 *
 * This is a macro rather than a function, so `imm` reaches the builtin as
 * written by the caller (presumably because the builtin needs a compile-time
 * constant there -- confirm against the builtin's definition).
 *
 * The expansion is a single parenthesized expression: no GNU statement
 * expression is needed to evaluate one call, and each argument is expanded
 * exactly once.
 */
#define _mm256_cvtps_ph(a, imm) \
  ((__m128i)__builtin_ia32_vcvtps2ph256((__v8sf)(__m256)(a), (imm)))
|
|
|
|
|
|
|
|
static __inline __m256 __attribute__((__always_inline__, __nodebug__, __target__("f16c")))
|
|
|
|
_mm256_cvtph_ps(__m128i __a)
|
|
|
|
{
|
|
|
|
return (__m256)__builtin_ia32_vcvtph2ps256((__v8hi)__a);
|
|
|
|
}
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif /* __AVX2__ */
|
2015-12-03 02:41:52 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__BMI__)
|
2011-12-25 14:25:37 +08:00
|
|
|
#include <bmiintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2011-12-25 14:25:37 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__BMI2__)
|
2011-12-26 10:31:10 +08:00
|
|
|
#include <bmi2intrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2011-12-26 10:31:10 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__LZCNT__)
|
2011-12-25 14:25:37 +08:00
|
|
|
#include <lzcntintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2011-12-25 14:25:37 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__FMA__)
|
2012-06-04 11:42:47 +08:00
|
|
|
#include <fmaintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2012-06-04 11:42:47 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512F__)
|
2014-07-22 19:31:39 +08:00
|
|
|
#include <avx512fintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2014-07-22 19:31:39 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512VL__)
|
2014-10-09 01:18:13 +08:00
|
|
|
#include <avx512vlintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2014-10-09 01:18:13 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512BW__)
|
2014-10-09 01:18:13 +08:00
|
|
|
#include <avx512bwintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2014-10-09 01:18:13 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512CD__)
|
2015-06-29 20:51:53 +08:00
|
|
|
#include <avx512cdintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2015-06-29 20:51:53 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512DQ__)
|
2015-04-30 17:24:29 +08:00
|
|
|
#include <avx512dqintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2015-04-30 17:24:29 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || \
|
|
|
|
(defined(__AVX512VL__) && defined(__AVX512BW__))
|
2014-10-09 01:18:13 +08:00
|
|
|
#include <avx512vlbwintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2014-10-09 01:18:13 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || \
|
|
|
|
(defined(__AVX512VL__) && defined(__AVX512CD__))
|
2016-04-27 19:43:14 +08:00
|
|
|
#include <avx512vlcdintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2016-04-27 19:43:14 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || \
|
|
|
|
(defined(__AVX512VL__) && defined(__AVX512DQ__))
|
2015-04-30 17:24:29 +08:00
|
|
|
#include <avx512vldqintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2015-04-30 17:24:29 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512ER__)
|
2014-07-22 19:31:39 +08:00
|
|
|
#include <avx512erintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2014-07-22 19:31:39 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512IFMA__)
|
2016-03-07 17:55:55 +08:00
|
|
|
#include <avx512ifmaintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2016-03-07 17:55:55 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || \
|
|
|
|
(defined(__AVX512IFMA__) && defined(__AVX512VL__))
|
2016-03-07 17:55:55 +08:00
|
|
|
#include <avx512ifmavlintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2016-03-07 17:55:55 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512VBMI__)
|
2016-03-08 01:04:11 +08:00
|
|
|
#include <avx512vbmiintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2016-03-08 01:04:11 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || \
|
|
|
|
(defined(__AVX512VBMI__) && defined(__AVX512VL__))
|
2016-03-08 01:04:11 +08:00
|
|
|
#include <avx512vbmivlintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2016-03-08 01:04:11 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512PF__)
|
2016-04-21 20:47:27 +08:00
|
|
|
#include <avx512pfintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2016-04-21 20:47:27 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__PKU__)
|
2015-12-31 22:14:07 +08:00
|
|
|
#include <pkuintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2015-12-31 22:14:07 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__RDRND__)
|
2015-06-17 15:09:32 +08:00
|
|
|
/* _rdrand16_step
 *
 * Forwards __p to __builtin_ia32_rdrand16_step and returns the builtin's
 * result as an int.  The definition is tagged with the "rdrnd" target
 * feature.
 *
 * __p: destination handed unchanged to the builtin.
 * Returns: the builtin's status value (Intel's intrinsics guide describes it
 *          as 1 when a random value was stored and 0 otherwise -- not
 *          verifiable from this header).
 */
static __inline__ int __attribute__((__always_inline__, __nodebug__, __target__("rdrnd")))
_rdrand16_step(unsigned short *__p)
{
  const int __status = __builtin_ia32_rdrand16_step(__p);

  return __status;
}
|
|
|
|
|
2015-06-17 15:09:32 +08:00
|
|
|
/* _rdrand32_step
 *
 * Forwards __p to __builtin_ia32_rdrand32_step and returns the builtin's
 * result as an int.  The definition is tagged with the "rdrnd" target
 * feature.
 *
 * __p: destination handed unchanged to the builtin.
 * Returns: the builtin's status value (Intel's intrinsics guide describes it
 *          as 1 when a random value was stored and 0 otherwise -- not
 *          verifiable from this header).
 */
static __inline__ int __attribute__((__always_inline__, __nodebug__, __target__("rdrnd")))
_rdrand32_step(unsigned int *__p)
{
  const int __status = __builtin_ia32_rdrand32_step(__p);

  return __status;
}
|
|
|
|
|
2016-06-01 20:21:00 +08:00
|
|
|
/* _bit_scan_forward
 *
 * Returns __builtin_ctz(__A): the number of trailing zero bits of __A, i.e.
 * the index of its lowest set bit.  __A is converted to unsigned int for the
 * builtin.  The builtin's result is undefined when __A is 0.
 *
 * NOTE(review): this definition sits between the RDRND-guarded #if and its
 * "#endif -- __RDRND__" even though nothing here uses RDRAND; confirm that
 * the guard is meant to cover it.
 */
static __inline__ int __attribute__((__always_inline__, __nodebug__))
_bit_scan_forward(int __A)
{
  const unsigned int __bits = (unsigned int)__A;

  return __builtin_ctz(__bits);
}
|
|
|
|
|
|
|
|
/* _bit_scan_reverse
 *
 * Returns 31 - __builtin_clz(__A): the index of the highest set bit of __A.
 * __A is converted to unsigned int for the builtin.  The builtin's result is
 * undefined when __A is 0.
 *
 * NOTE(review): this definition sits between the RDRND-guarded #if and its
 * "#endif -- __RDRND__" even though nothing here uses RDRAND; confirm that
 * the guard is meant to cover it.
 */
static __inline__ int __attribute__((__always_inline__, __nodebug__))
_bit_scan_reverse(int __A)
{
  const int __leading_zeros = __builtin_clz((unsigned int)__A);

  return 31 - __leading_zeros;
}
|
|
|
|
|
2012-07-12 17:33:03 +08:00
|
|
|
#ifdef __x86_64__
|
2015-06-17 15:09:32 +08:00
|
|
|
/* _rdrand64_step
 *
 * Forwards __p to __builtin_ia32_rdrand64_step and returns the builtin's
 * result as an int.  The definition is tagged with the "rdrnd" target
 * feature and is only present when __x86_64__ is defined.
 *
 * __p: destination handed unchanged to the builtin.
 * Returns: the builtin's status value (Intel's intrinsics guide describes it
 *          as 1 when a random value was stored and 0 otherwise -- not
 *          verifiable from this header).
 */
static __inline__ int __attribute__((__always_inline__, __nodebug__, __target__("rdrnd")))
_rdrand64_step(unsigned long long *__p)
{
  const int __status = __builtin_ia32_rdrand64_step(__p);

  return __status;
}
|
|
|
|
#endif
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif /* __RDRND__ */
|
2012-07-12 17:33:03 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__FSGSBASE__)
|
2014-11-03 14:51:41 +08:00
|
|
|
#ifdef __x86_64__
|
2015-06-17 15:09:32 +08:00
|
|
|
/* _readfsbase_u32
 *
 * Returns the value produced by __builtin_ia32_rdfsbase32() as an unsigned
 * int.  Takes no arguments.  The definition is tagged with the "fsgsbase"
 * target feature and is only present when __x86_64__ is defined.
 */
static __inline__ unsigned int __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
_readfsbase_u32(void)
{
  const unsigned int __base = __builtin_ia32_rdfsbase32();

  return __base;
}
|
|
|
|
|
2015-06-17 15:09:32 +08:00
|
|
|
/* _readfsbase_u64
 *
 * Returns the value produced by __builtin_ia32_rdfsbase64() as an unsigned
 * long long.  Takes no arguments.  The definition is tagged with the
 * "fsgsbase" target feature and is only present when __x86_64__ is defined.
 */
static __inline__ unsigned long long __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
_readfsbase_u64(void)
{
  const unsigned long long __base = __builtin_ia32_rdfsbase64();

  return __base;
}
|
|
|
|
|
2015-06-17 15:09:32 +08:00
|
|
|
/* _readgsbase_u32
 *
 * Returns the value produced by __builtin_ia32_rdgsbase32() as an unsigned
 * int.  Takes no arguments.  The definition is tagged with the "fsgsbase"
 * target feature and is only present when __x86_64__ is defined.
 */
static __inline__ unsigned int __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
_readgsbase_u32(void)
{
  const unsigned int __base = __builtin_ia32_rdgsbase32();

  return __base;
}
|
|
|
|
|
2015-06-17 15:09:32 +08:00
|
|
|
/* _readgsbase_u64
 *
 * Returns the value produced by __builtin_ia32_rdgsbase64() as an unsigned
 * long long.  Takes no arguments.  The definition is tagged with the
 * "fsgsbase" target feature and is only present when __x86_64__ is defined.
 */
static __inline__ unsigned long long __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
_readgsbase_u64(void)
{
  const unsigned long long __base = __builtin_ia32_rdgsbase64();

  return __base;
}
|
|
|
|
|
2015-06-17 15:09:32 +08:00
|
|
|
/* _writefsbase_u32
 *
 * Passes __V to __builtin_ia32_wrfsbase32.  Produces no value.  The
 * definition is tagged with the "fsgsbase" target feature and is only
 * present when __x86_64__ is defined.
 *
 * __V: value handed unchanged to the builtin.
 *
 * The builtin is invoked as a plain statement: ISO C does not allow a
 * `return` with an expression in a function whose return type is void.
 */
static __inline__ void __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
_writefsbase_u32(unsigned int __V)
{
  __builtin_ia32_wrfsbase32(__V);
}
|
|
|
|
|
2015-06-17 15:09:32 +08:00
|
|
|
/* _writefsbase_u64
 *
 * Passes __V to __builtin_ia32_wrfsbase64.  Produces no value.  The
 * definition is tagged with the "fsgsbase" target feature and is only
 * present when __x86_64__ is defined.
 *
 * __V: value handed unchanged to the builtin.
 *
 * The builtin is invoked as a plain statement: ISO C does not allow a
 * `return` with an expression in a function whose return type is void.
 */
static __inline__ void __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
_writefsbase_u64(unsigned long long __V)
{
  __builtin_ia32_wrfsbase64(__V);
}
|
|
|
|
|
2015-06-17 15:09:32 +08:00
|
|
|
/* _writegsbase_u32
 *
 * Passes __V to __builtin_ia32_wrgsbase32.  Produces no value.  The
 * definition is tagged with the "fsgsbase" target feature and is only
 * present when __x86_64__ is defined.
 *
 * __V: value handed unchanged to the builtin.
 *
 * The builtin is invoked as a plain statement: ISO C does not allow a
 * `return` with an expression in a function whose return type is void.
 */
static __inline__ void __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
_writegsbase_u32(unsigned int __V)
{
  __builtin_ia32_wrgsbase32(__V);
}
|
|
|
|
|
2015-06-17 15:09:32 +08:00
|
|
|
/* _writegsbase_u64
 *
 * Passes __V to __builtin_ia32_wrgsbase64.  Produces no value.  The
 * definition is tagged with the "fsgsbase" target feature and is only
 * present when __x86_64__ is defined.
 *
 * __V: value handed unchanged to the builtin.
 *
 * The builtin is invoked as a plain statement: ISO C does not allow a
 * `return` with an expression in a function whose return type is void.
 */
static __inline__ void __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
_writegsbase_u64(unsigned long long __V)
{
  __builtin_ia32_wrgsbase64(__V);
}
|
2016-06-01 20:21:00 +08:00
|
|
|
|
2014-11-03 14:51:41 +08:00
|
|
|
#endif
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif /* __FSGSBASE__ */
|
2014-11-03 14:51:41 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__RTM__)
|
2012-11-10 13:17:46 +08:00
|
|
|
#include <rtmintrin.h>
|
2015-06-18 02:42:07 +08:00
|
|
|
#include <xtestintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2013-03-29 13:14:06 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__SHA__)
|
2013-09-19 22:00:22 +08:00
|
|
|
#include <shaintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2013-09-19 22:00:22 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__FXSR__)
|
2015-06-30 17:45:38 +08:00
|
|
|
#include <fxsrintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2015-06-30 17:45:38 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__XSAVE__)
|
2015-10-13 20:29:35 +08:00
|
|
|
#include <xsaveintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2015-10-13 20:29:35 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__XSAVEOPT__)
|
2015-10-13 20:29:35 +08:00
|
|
|
#include <xsaveoptintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2015-10-13 20:29:35 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__XSAVEC__)
|
2015-10-13 20:29:35 +08:00
|
|
|
#include <xsavecintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2015-10-13 20:29:35 +08:00
|
|
|
|
2016-05-17 02:14:07 +08:00
|
|
|
#if !defined(_MSC_VER) || __has_feature(modules) || defined(__XSAVES__)
|
2015-10-13 20:29:35 +08:00
|
|
|
#include <xsavesintrin.h>
|
2016-05-17 02:14:07 +08:00
|
|
|
#endif
|
2015-10-13 20:29:35 +08:00
|
|
|
|
2015-06-18 02:42:03 +08:00
|
|
|
/* Some intrinsics inside adxintrin.h are available only on processors with ADX,
 * whereas others are available at all times. */
|
2014-09-19 18:17:06 +08:00
|
|
|
#include <adxintrin.h>
|
|
|
|
|
2010-08-21 02:04:07 +08:00
|
|
|
#endif /* __IMMINTRIN_H */
|