llvm-project/clang/lib/Headers/f16cintrin.h

/*===---- f16cintrin.h - F16C intrinsics -----------------------------------===
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 *
 *===-----------------------------------------------------------------------===
 */

/* Refuse direct inclusion: compilation stops with the error below unless at
 * least one of __X86INTRIN_H, __EMMINTRIN_H or __IMMINTRIN_H is already
 * defined (presumably the include guards of <x86intrin.h>, <emmintrin.h> and
 * <immintrin.h> -- confirm against those headers). */
#if !defined __X86INTRIN_H && !defined __EMMINTRIN_H && !defined __IMMINTRIN_H
#error "Never use <f16cintrin.h> directly; include <emmintrin.h> instead."
#endif

#ifndef __F16CINTRIN_H
#define __F16CINTRIN_H

/* Define the default attributes for the functions in this file: every
 * function carrying this macro is marked always_inline and nodebug, and is
 * compiled with the "f16c" target feature enabled for that function.
 * The macro is file-local; it is #undef'ed again at the end of this header. */
#define __DEFAULT_FN_ATTRS \
  __attribute__((__always_inline__, __nodebug__, __target__("f16c")))

/// \brief Converts a 16-bit half-precision float value into a 32-bit float
///    value.
///
/// \headerfile <x86intrin.h>
///
/// This intrinsic corresponds to the <c> VCVTPH2PS </c> instruction.
///
/// \param __a
///    A 16-bit half-precision float value, passed as its raw 16-bit pattern.
/// \returns The converted 32-bit float value.
static __inline float __DEFAULT_FN_ATTRS
_cvtsh_ss(unsigned short __a)
{
  /* Locals use reserved (double-underscore) names, like the parameter, so
     that a user macro named e.g. 'v' or 'r' cannot break this header. */

  /* Put the input in element 0; the remaining seven elements are zero. */
  __v8hi __v = {(short)__a, 0, 0, 0, 0, 0, 0, 0};
  __v4sf __r = __builtin_ia32_vcvtph2ps(__v);

  /* Only element 0 of the converted vector corresponds to __a. */
  return __r[0];
}

/// \brief Converts a 32-bit single-precision float value to a 16-bit
///    half-precision float value.
///
/// \headerfile <x86intrin.h>
///
/// \code
/// unsigned short _cvtss_sh(float a, const int imm);
/// \endcode
///
/// This intrinsic corresponds to the <c> VCVTPS2PH </c> instruction.
///
/// The expansion places \a a in element 0 of a 4 x float vector whose other
/// three elements are zero, converts that vector, views the result as eight
/// 16-bit elements and yields element 0 as an unsigned short.
///
/// \note This is a macro, not a function: \a a is substituted textually into
///    a vector initializer and \a imm is forwarded to the builtin. The
///    <c> __extension__ </c> prefix suppresses warnings about the compound
///    literal when compiling with earlier language standards.
///
/// \param a
///    A 32-bit single-precision float value to be converted to a 16-bit
///    half-precision float value.
/// \param imm
///    An immediate value controlling rounding using bits [2:0]: \n
///    000: Nearest \n
///    001: Down \n
///    010: Up \n
///    011: Truncate \n
///    1XX: Use MXCSR.RC for rounding
/// \returns The converted 16-bit half-precision float value.
#define _cvtss_sh(a, imm) __extension__ ({ \
  (unsigned short)(((__v8hi)__builtin_ia32_vcvtps2ph((__v4sf){a, 0, 0, 0}, \
                                                     (imm)))[0]); })

/// \brief Converts a 128-bit vector containing 32-bit float values into a
///    128-bit vector containing 16-bit half-precision float values.
///
/// \headerfile <x86intrin.h>
///
/// \code
/// __m128i _mm_cvtps_ph(__m128 a, const int imm);
/// \endcode
///
/// This intrinsic corresponds to the <c> VCVTPS2PH </c> instruction.
///
/// \note This is a macro, not a function: \a a is cast to <c> __m128 </c> and
///    then to a 4 x float vector before being handed to the builtin, \a imm is
///    forwarded to the builtin, and the builtin's result is cast to
///    <c> __m128i </c>.
///
/// \param a
///    A 128-bit vector containing 32-bit float values.
/// \param imm
///    An immediate value controlling rounding using bits [2:0]: \n
///    000: Nearest \n
///    001: Down \n
///    010: Up \n
///    011: Truncate \n
///    1XX: Use MXCSR.RC for rounding
/// \returns A 128-bit vector containing converted 16-bit half-precision float
///    values. The lower 64 bits are used to store the converted 16-bit
///    half-precision floating-point values.
#define _mm_cvtps_ph(a, imm) __extension__ ({ \
  (__m128i)__builtin_ia32_vcvtps2ph((__v4sf)(__m128)(a), (imm)); })

/// \brief Widens the 16-bit half-precision float values held in the lower
///    64 bits of a 128-bit vector into a 128-bit vector of 32-bit floats.
///
/// \headerfile <x86intrin.h>
///
/// This intrinsic corresponds to the <c> VCVTPH2PS </c> instruction.
///
/// \param __a
///    A 128-bit vector holding 16-bit half-precision float values. Only the
///    lower 64 bits take part in the conversion.
/// \returns A 128-bit vector of [4 x float] holding the converted values.
static __inline __m128 __DEFAULT_FN_ATTRS
_mm_cvtph_ps(__m128i __a)
{
  /* View the integer vector as eight 16-bit elements for the builtin. */
  __v8hi __halves = (__v8hi)__a;
  __v4sf __singles = __builtin_ia32_vcvtph2ps(__halves);

  /* Hand the result back using the public 128-bit float vector type. */
  return (__m128)__singles;
}

/* Drop the file-local attribute macro defined near the top of this header. */
#undef __DEFAULT_FN_ATTRS

#endif /* __F16CINTRIN_H */
Remove some stray underscores from copyright block. Fix first line length to match length of the one after the copyright block. llvm-svn: 191483 2013-09-27 11:57:18 +08:00			`/*===---- f16cintrin.h - F16C intrinsics -----------------------------------===`
X86: add F16C support in Clang Support the following intrinsics: _mm_cvtph_ps, _mm256_cvtph_ps, _mm_cvtps_ph, _mm256_cvtps_ph rdar://12407875 llvm-svn: 165685 2012-10-11 08:59:55 +08:00			`*`
Remove some stray underscores from copyright block. Fix first line length to match length of the one after the copyright block. llvm-svn: 191483 2013-09-27 11:57:18 +08:00			`* Permission is hereby granted, free of charge, to any person obtaining a copy`
X86: add F16C support in Clang Support the following intrinsics: _mm_cvtph_ps, _mm256_cvtph_ps, _mm_cvtps_ph, _mm256_cvtps_ph rdar://12407875 llvm-svn: 165685 2012-10-11 08:59:55 +08:00			`* of this software and associated documentation files (the "Software"), to deal`
			`* in the Software without restriction, including without limitation the rights`
			`* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell`
			`* copies of the Software, and to permit persons to whom the Software is`
			`* furnished to do so, subject to the following conditions:`
			`*`
			`* The above copyright notice and this permission notice shall be included in`
			`* all copies or substantial portions of the Software.`
			`*`
			`* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR`
			`* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,`
			`* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE`
			`* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER`
			`* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,`
			`* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN`
			`* THE SOFTWARE.`
			`*`
			`*===-----------------------------------------------------------------------===`
			`*/`

[X86] Make f16c intrinsics accessible through emmintrin.h, per Intel docs Differential Revision: http://reviews.llvm.org/D13015 llvm-svn: 248156 2015-09-21 21:34:47 +08:00			`#if !defined __X86INTRIN_H && !defined __EMMINTRIN_H && !defined __IMMINTRIN_H`
			`#error "Never use <f16cintrin.h> directly; include <emmintrin.h> instead."`
X86: add F16C support in Clang Support the following intrinsics: _mm_cvtph_ps, _mm256_cvtph_ps, _mm_cvtps_ph, _mm256_cvtps_ph rdar://12407875 llvm-svn: 165685 2012-10-11 08:59:55 +08:00			`#endif`

			`#ifndef __F16CINTRIN_H`
			`#define __F16CINTRIN_H`

Use a define for per-file function attributes for the Intel intrinsic headers. This is a precursor to changing them to use the new target attribute code. llvm-svn: 239882 2015-06-17 15:09:20 +08:00			`/* Define the default attributes for the functions in this file. */`
This patch adds doxygen comments for all the intrinsincs in the header file f16cintrin.h. The doxygen comments are automatically generated based on Sony's intrinsics document. Differential Revision: http://reviews.llvm.org/D17021 llvm-svn: 260333 2016-02-10 08:12:24 +08:00			`#define __DEFAULT_FN_ATTRS \`
2 missing intrinsics _cvtss_sh and _mm_cvtps_ph were added to the intrinsics header f16intrin.h Differential Revision: http://reviews.llvm.org/D16177 llvm-svn: 258492 2016-01-22 14:50:50 +08:00			`__attribute__((__always_inline__, __nodebug__, __target__("f16c")))`
Use a define for per-file function attributes for the Intel intrinsic headers. This is a precursor to changing them to use the new target attribute code. llvm-svn: 239882 2015-06-17 15:09:20 +08:00
This patch adds doxygen comments for all the intrinsincs in the header file f16cintrin.h. The doxygen comments are automatically generated based on Sony's intrinsics document. Differential Revision: http://reviews.llvm.org/D17021 llvm-svn: 260333 2016-02-10 08:12:24 +08:00			`/// \brief Converts a 16-bit half-precision float value into a 32-bit float`
			`/// value.`
			`///`
			`/// \headerfile <x86intrin.h>`
			`///`
[DOXYGEN] Improved doxygen comments for x86 intrinsics headers. Tagged instruction names with <c> INSTR_NAME </c> to display them in typewriter font. In the past, \c command was used, unfortunately it applied to only one word. <c> .. </c> has the same meaning, but applies to all words in between the tags. llvm-svn: 289249 2016-12-10 02:35:50 +08:00			`/// This intrinsic corresponds to the <c> VCVTPH2PS </c> instruction.`
This patch adds doxygen comments for all the intrinsincs in the header file f16cintrin.h. The doxygen comments are automatically generated based on Sony's intrinsics document. Differential Revision: http://reviews.llvm.org/D17021 llvm-svn: 260333 2016-02-10 08:12:24 +08:00			`///`
Doxygen comments for avxintrin.h. Added doxygen comments to avxintrin.h's intrinsics. As of now, only around 50% of the intrinsics in this file are documented here. The patches for the other half will be sent out later. Updated bmiintrin.h to fix an incorrect section name. Updated f16cintrin.h to fix incorect parameter names. The doxygen comments are automatically generated based on Sony's intrinsics document. I got an OK from Eric Christopher to commit doxygen comments without prior code review upstream. llvm-svn: 269718 2016-05-17 06:54:45 +08:00			`/// \param __a`
This patch adds doxygen comments for all the intrinsincs in the header file f16cintrin.h. The doxygen comments are automatically generated based on Sony's intrinsics document. Differential Revision: http://reviews.llvm.org/D17021 llvm-svn: 260333 2016-02-10 08:12:24 +08:00			`/// A 16-bit half-precision float value.`
			`/// \returns The converted 32-bit float value.`
2 missing intrinsics _cvtss_sh and _mm_cvtps_ph were added to the intrinsics header f16intrin.h Differential Revision: http://reviews.llvm.org/D16177 llvm-svn: 258492 2016-01-22 14:50:50 +08:00			`static __inline float __DEFAULT_FN_ATTRS`
Use __ before argument names in provided headers. llvm-svn: 260631 2016-02-12 08:32:23 +08:00			`_cvtsh_ss(unsigned short __a)`
2 missing intrinsics _cvtss_sh and _mm_cvtps_ph were added to the intrinsics header f16intrin.h Differential Revision: http://reviews.llvm.org/D16177 llvm-svn: 258492 2016-01-22 14:50:50 +08:00			`{`
Use __ before argument names in provided headers. llvm-svn: 260631 2016-02-12 08:32:23 +08:00			`__v8hi v = {(short)__a, 0, 0, 0, 0, 0, 0, 0};`
2 missing intrinsics _cvtss_sh and _mm_cvtps_ph were added to the intrinsics header f16intrin.h Differential Revision: http://reviews.llvm.org/D16177 llvm-svn: 258492 2016-01-22 14:50:50 +08:00			`__v4sf r = __builtin_ia32_vcvtph2ps(v);`
			`return r[0];`
			`}`

This patch adds doxygen comments for all the intrinsincs in the header file f16cintrin.h. The doxygen comments are automatically generated based on Sony's intrinsics document. Differential Revision: http://reviews.llvm.org/D17021 llvm-svn: 260333 2016-02-10 08:12:24 +08:00			`/// \brief Converts a 32-bit single-precision float value to a 16-bit`
			`/// half-precision float value.`
			`///`
			`/// \headerfile <x86intrin.h>`
			`///`
			`/// \code`
			`/// unsigned short _cvtss_sh(float a, const int imm);`
			`/// \endcode`
			`///`
[DOXYGEN] Improved doxygen comments for x86 intrinsics headers. Tagged instruction names with <c> INSTR_NAME </c> to display them in typewriter font. In the past, \c command was used, unfortunately it applied to only one word. <c> .. </c> has the same meaning, but applies to all words in between the tags. llvm-svn: 289249 2016-12-10 02:35:50 +08:00			`/// This intrinsic corresponds to the <c> VCVTPS2PH </c> instruction.`
This patch adds doxygen comments for all the intrinsincs in the header file f16cintrin.h. The doxygen comments are automatically generated based on Sony's intrinsics document. Differential Revision: http://reviews.llvm.org/D17021 llvm-svn: 260333 2016-02-10 08:12:24 +08:00			`///`
			`/// \param a`
			`/// A 32-bit single-precision float value to be converted to a 16-bit`
			`/// half-precision float value.`
			`/// \param imm`
[DOXYGEN] Improved doxygen comments for x86 intrinsics. Improved doxygen comments for the following intrinsics headers: __wmmintrin_pclmul.h, bmiintrin.h, emmintrin.h, f16cintrin.h, immintrin.h, mmintrin.h, pmmintrin.h, tmmintrin.h Added \n commands to insert a line breaks where necessary, since one long line of documentation is nearly unreadable. Formatted comments to fit into 80 chars. In some cases added \a command in front of the parameter names to display them in italics. llvm-svn: 290561 2016-12-27 08:49:38 +08:00			`/// An immediate value controlling rounding using bits [2:0]: \n`
			`/// 000: Nearest \n`
			`/// 001: Down \n`
			`/// 010: Up \n`
			`/// 011: Truncate \n`
This patch adds doxygen comments for all the intrinsincs in the header file f16cintrin.h. The doxygen comments are automatically generated based on Sony's intrinsics document. Differential Revision: http://reviews.llvm.org/D17021 llvm-svn: 260333 2016-02-10 08:12:24 +08:00			`/// 1XX: Use MXCSR.RC for rounding`
			`/// \returns The converted 16-bit half-precision float value.`
Recommit r299321 '[X86] Add __extension__ to f16c macro intrinsics to suppress warnings about compound literals when compiled for with earlier language standards enabled.' The bot didn't recover after the revert. So it looks like this wasn't the issue. llvm-svn: 299397 2017-04-04 06:59:30 +08:00			`#define _cvtss_sh(a, imm) __extension__ ({ \`
			`(unsigned short)(((__v8hi)__builtin_ia32_vcvtps2ph((__v4sf){a, 0, 0, 0}, \`
			`(imm)))[0]); })`
2 missing intrinsics _cvtss_sh and _mm_cvtps_ph were added to the intrinsics header f16intrin.h Differential Revision: http://reviews.llvm.org/D16177 llvm-svn: 258492 2016-01-22 14:50:50 +08:00
This patch adds doxygen comments for all the intrinsincs in the header file f16cintrin.h. The doxygen comments are automatically generated based on Sony's intrinsics document. Differential Revision: http://reviews.llvm.org/D17021 llvm-svn: 260333 2016-02-10 08:12:24 +08:00			`/// \brief Converts a 128-bit vector containing 32-bit float values into a`
			`/// 128-bit vector containing 16-bit half-precision float values.`
			`///`
			`/// \headerfile <x86intrin.h>`
			`///`
			`/// \code`
			`/// __m128i _mm_cvtps_ph(__m128 a, const int imm);`
			`/// \endcode`
			`///`
[DOXYGEN] Improved doxygen comments for x86 intrinsics headers. Tagged instruction names with <c> INSTR_NAME </c> to display them in typewriter font. In the past, \c command was used, unfortunately it applied to only one word. <c> .. </c> has the same meaning, but applies to all words in between the tags. llvm-svn: 289249 2016-12-10 02:35:50 +08:00			`/// This intrinsic corresponds to the <c> VCVTPS2PH </c> instruction.`
This patch adds doxygen comments for all the intrinsincs in the header file f16cintrin.h. The doxygen comments are automatically generated based on Sony's intrinsics document. Differential Revision: http://reviews.llvm.org/D17021 llvm-svn: 260333 2016-02-10 08:12:24 +08:00			`///`
			`/// \param a`
			`/// A 128-bit vector containing 32-bit float values.`
			`/// \param imm`
[DOXYGEN] Improved doxygen comments for x86 intrinsics. Improved doxygen comments for the following intrinsics headers: __wmmintrin_pclmul.h, bmiintrin.h, emmintrin.h, f16cintrin.h, immintrin.h, mmintrin.h, pmmintrin.h, tmmintrin.h Added \n commands to insert a line breaks where necessary, since one long line of documentation is nearly unreadable. Formatted comments to fit into 80 chars. In some cases added \a command in front of the parameter names to display them in italics. llvm-svn: 290561 2016-12-27 08:49:38 +08:00			`/// An immediate value controlling rounding using bits [2:0]: \n`
			`/// 000: Nearest \n`
			`/// 001: Down \n`
			`/// 010: Up \n`
			`/// 011: Truncate \n`
This patch adds doxygen comments for all the intrinsincs in the header file f16cintrin.h. The doxygen comments are automatically generated based on Sony's intrinsics document. Differential Revision: http://reviews.llvm.org/D17021 llvm-svn: 260333 2016-02-10 08:12:24 +08:00			`/// 1XX: Use MXCSR.RC for rounding`
			`/// \returns A 128-bit vector containing converted 16-bit half-precision float`
			`/// values. The lower 64 bits are used to store the converted 16-bit`
			`/// half-precision floating-point values.`
Recommit r299321 '[X86] Add __extension__ to f16c macro intrinsics to suppress warnings about compound literals when compiled for with earlier language standards enabled.' The bot didn't recover after the revert. So it looks like this wasn't the issue. llvm-svn: 299397 2017-04-04 06:59:30 +08:00			`#define _mm_cvtps_ph(a, imm) __extension__ ({ \`
			`(__m128i)__builtin_ia32_vcvtps2ph((__v4sf)(__m128)(a), (imm)); })`
X86: add F16C support in Clang Support the following intrinsics: _mm_cvtph_ps, _mm256_cvtph_ps, _mm_cvtps_ph, _mm256_cvtps_ph rdar://12407875 llvm-svn: 165685 2012-10-11 08:59:55 +08:00
This patch adds doxygen comments for all the intrinsincs in the header file f16cintrin.h. The doxygen comments are automatically generated based on Sony's intrinsics document. Differential Revision: http://reviews.llvm.org/D17021 llvm-svn: 260333 2016-02-10 08:12:24 +08:00			`/// \brief Converts a 128-bit vector containing 16-bit half-precision float`
			`/// values into a 128-bit vector containing 32-bit float values.`
			`///`
			`/// \headerfile <x86intrin.h>`
			`///`
[DOXYGEN] Improved doxygen comments for x86 intrinsics headers. Tagged instruction names with <c> INSTR_NAME </c> to display them in typewriter font. In the past, \c command was used, unfortunately it applied to only one word. <c> .. </c> has the same meaning, but applies to all words in between the tags. llvm-svn: 289249 2016-12-10 02:35:50 +08:00			`/// This intrinsic corresponds to the <c> VCVTPH2PS </c> instruction.`
This patch adds doxygen comments for all the intrinsincs in the header file f16cintrin.h. The doxygen comments are automatically generated based on Sony's intrinsics document. Differential Revision: http://reviews.llvm.org/D17021 llvm-svn: 260333 2016-02-10 08:12:24 +08:00			`///`
Doxygen comments for avxintrin.h. Added doxygen comments to avxintrin.h's intrinsics. As of now, only around 50% of the intrinsics in this file are documented here. The patches for the other half will be sent out later. Updated bmiintrin.h to fix an incorrect section name. Updated f16cintrin.h to fix incorect parameter names. The doxygen comments are automatically generated based on Sony's intrinsics document. I got an OK from Eric Christopher to commit doxygen comments without prior code review upstream. llvm-svn: 269718 2016-05-17 06:54:45 +08:00			`/// \param __a`
This patch adds doxygen comments for all the intrinsincs in the header file f16cintrin.h. The doxygen comments are automatically generated based on Sony's intrinsics document. Differential Revision: http://reviews.llvm.org/D17021 llvm-svn: 260333 2016-02-10 08:12:24 +08:00			`/// A 128-bit vector containing 16-bit half-precision float values. The lower`
			`/// 64 bits are used in the conversion.`
			`/// \returns A 128-bit vector of [4 x float] containing converted float values.`
[X86] Rename DEFAULT_FN_ATTR macro to __DEFAULT_FN_ATTR llvm-svn: 241065 2015-06-30 21:36:19 +08:00			`static __inline __m128 __DEFAULT_FN_ATTRS`
Use __ before argument names in provided headers. llvm-svn: 260631 2016-02-12 08:32:23 +08:00			`_mm_cvtph_ps(__m128i __a)`
X86: add F16C support in Clang Support the following intrinsics: _mm_cvtph_ps, _mm256_cvtph_ps, _mm_cvtps_ph, _mm256_cvtps_ph rdar://12407875 llvm-svn: 165685 2012-10-11 08:59:55 +08:00			`{`
Use __ before argument names in provided headers. llvm-svn: 260631 2016-02-12 08:32:23 +08:00			`return (__m128)__builtin_ia32_vcvtph2ps((__v8hi)__a);`
X86: add F16C support in Clang Support the following intrinsics: _mm_cvtph_ps, _mm256_cvtph_ps, _mm_cvtps_ph, _mm256_cvtps_ph rdar://12407875 llvm-svn: 165685 2012-10-11 08:59:55 +08:00			`}`

[X86] Rename DEFAULT_FN_ATTR macro to __DEFAULT_FN_ATTR llvm-svn: 241065 2015-06-30 21:36:19 +08:00			`#undef __DEFAULT_FN_ATTRS`
Use a define for per-file function attributes for the Intel intrinsic headers. This is a precursor to changing them to use the new target attribute code. llvm-svn: 239882 2015-06-17 15:09:20 +08:00
X86: add F16C support in Clang Support the following intrinsics: _mm_cvtph_ps, _mm256_cvtph_ps, _mm_cvtps_ph, _mm256_cvtps_ph rdar://12407875 llvm-svn: 165685 2012-10-11 08:59:55 +08:00			`#endif /* __F16CINTRIN_H */`