123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374 |
- /*===---- immintrin.h - Intel intrinsics -----------------------------------===
- *
- * Permission is hereby granted, free of charge, to any person obtaining a copy
- * of this software and associated documentation files (the "Software"), to deal
- * in the Software without restriction, including without limitation the rights
- * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
- * copies of the Software, and to permit persons to whom the Software is
- * furnished to do so, subject to the following conditions:
- *
- * The above copyright notice and this permission notice shall be included in
- * all copies or substantial portions of the Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
- * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
- * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
- * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
- * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
- * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
- * THE SOFTWARE.
- *
- *===-----------------------------------------------------------------------===
- */
- #ifndef __IMMINTRIN_H
- #define __IMMINTRIN_H
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__MMX__)
- #include <mmintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__SSE__)
- #include <xmmintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__SSE2__)
- #include <emmintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__SSE3__)
- #include <pmmintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__SSSE3__)
- #include <tmmintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || \
- (defined(__SSE4_2__) || defined(__SSE4_1__))
- #include <smmintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || \
- (defined(__AES__) || defined(__PCLMUL__))
- #include <wmmintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__CLFLUSHOPT__)
- #include <clflushoptintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__CLWB__)
- #include <clwbintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX__)
- #include <avxintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX2__)
- #include <avx2intrin.h>
- /* The 256-bit versions of functions in f16cintrin.h.
- Intel documents these as being in immintrin.h, and
- they depend on typedefs from avxintrin.h. */
- /// \brief Converts a 256-bit vector of [8 x float] into a 128-bit vector
- /// containing 16-bit half-precision float values.
- ///
- /// \headerfile <x86intrin.h>
- ///
- /// \code
- /// __m128i _mm256_cvtps_ph(__m256 a, const int imm);
- /// \endcode
- ///
- /// This intrinsic corresponds to the <c> VCVTPS2PH </c> instruction.
- ///
- /// \param a
- /// A 256-bit vector containing 32-bit single-precision float values to be
- /// converted to 16-bit half-precision float values.
- /// \param imm
- /// An immediate value controlling rounding using bits [2:0]: \n
- /// 000: Nearest \n
- /// 001: Down \n
- /// 010: Up \n
- /// 011: Truncate \n
- /// 1XX: Use MXCSR.RC for rounding
- /// \returns A 128-bit vector containing the converted 16-bit half-precision
- /// float values.
- #define _mm256_cvtps_ph(a, imm) __extension__ ({ \
- (__m128i)__builtin_ia32_vcvtps2ph256((__v8sf)(__m256)(a), (imm)); })
- /// \brief Converts a 128-bit vector containing 16-bit half-precision float
- /// values into a 256-bit vector of [8 x float].
- ///
- /// \headerfile <x86intrin.h>
- ///
- /// This intrinsic corresponds to the <c> VCVTPH2PS </c> instruction.
- ///
- /// \param __a
- /// A 128-bit vector containing 16-bit half-precision float values to be
- /// converted to 32-bit single-precision float values.
- /// \returns A vector of [8 x float] containing the converted 32-bit
- /// single-precision float values.
- static __inline __m256 __attribute__((__always_inline__, __nodebug__, __target__("f16c")))
- _mm256_cvtph_ps(__m128i __a)
- {
- return (__m256)__builtin_ia32_vcvtph2ps256((__v8hi)__a);
- }
- #endif /* __AVX2__ */
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__VPCLMULQDQ__)
- #include <vpclmulqdqintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__BMI__)
- #include <bmiintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__BMI2__)
- #include <bmi2intrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__LZCNT__)
- #include <lzcntintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__FMA__)
- #include <fmaintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512F__)
- #include <avx512fintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512VL__)
- #include <avx512vlintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512BW__)
- #include <avx512bwintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512BITALG__)
- #include <avx512bitalgintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512CD__)
- #include <avx512cdintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512VPOPCNTDQ__)
- #include <avx512vpopcntdqintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || \
- (defined(__AVX512VL__) && defined(__AVX512VPOPCNTDQ__))
- #include <avx512vpopcntdqvlintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512VNNI__)
- #include <avx512vnniintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || \
- (defined(__AVX512VL__) && defined(__AVX512VNNI__))
- #include <avx512vlvnniintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512DQ__)
- #include <avx512dqintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || \
- (defined(__AVX512VL__) && defined(__AVX512BITALG__))
- #include <avx512vlbitalgintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || \
- (defined(__AVX512VL__) && defined(__AVX512BW__))
- #include <avx512vlbwintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || \
- (defined(__AVX512VL__) && defined(__AVX512CD__))
- #include <avx512vlcdintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || \
- (defined(__AVX512VL__) && defined(__AVX512DQ__))
- #include <avx512vldqintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512ER__)
- #include <avx512erintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512IFMA__)
- #include <avx512ifmaintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || \
- (defined(__AVX512IFMA__) && defined(__AVX512VL__))
- #include <avx512ifmavlintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512VBMI__)
- #include <avx512vbmiintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || \
- (defined(__AVX512VBMI__) && defined(__AVX512VL__))
- #include <avx512vbmivlintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512VBMI2__)
- #include <avx512vbmi2intrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || \
- (defined(__AVX512VBMI2__) && defined(__AVX512VL__))
- #include <avx512vlvbmi2intrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__AVX512PF__)
- #include <avx512pfintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__PKU__)
- #include <pkuintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__VAES__)
- #include <vaesintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__GFNI__)
- #include <gfniintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__RDRND__)
- static __inline__ int __attribute__((__always_inline__, __nodebug__, __target__("rdrnd")))
- _rdrand16_step(unsigned short *__p)
- {
- return __builtin_ia32_rdrand16_step(__p);
- }
- static __inline__ int __attribute__((__always_inline__, __nodebug__, __target__("rdrnd")))
- _rdrand32_step(unsigned int *__p)
- {
- return __builtin_ia32_rdrand32_step(__p);
- }
- #ifdef __x86_64__
- static __inline__ int __attribute__((__always_inline__, __nodebug__, __target__("rdrnd")))
- _rdrand64_step(unsigned long long *__p)
- {
- return __builtin_ia32_rdrand64_step(__p);
- }
- #endif
- #endif /* __RDRND__ */
- /* __bit_scan_forward */
- static __inline__ int __attribute__((__always_inline__, __nodebug__))
- _bit_scan_forward(int __A) {
- return __builtin_ctz(__A);
- }
- /* __bit_scan_reverse */
- static __inline__ int __attribute__((__always_inline__, __nodebug__))
- _bit_scan_reverse(int __A) {
- return 31 - __builtin_clz(__A);
- }
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__FSGSBASE__)
- #ifdef __x86_64__
- static __inline__ unsigned int __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
- _readfsbase_u32(void)
- {
- return __builtin_ia32_rdfsbase32();
- }
- static __inline__ unsigned long long __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
- _readfsbase_u64(void)
- {
- return __builtin_ia32_rdfsbase64();
- }
- static __inline__ unsigned int __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
- _readgsbase_u32(void)
- {
- return __builtin_ia32_rdgsbase32();
- }
- static __inline__ unsigned long long __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
- _readgsbase_u64(void)
- {
- return __builtin_ia32_rdgsbase64();
- }
- static __inline__ void __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
- _writefsbase_u32(unsigned int __V)
- {
- return __builtin_ia32_wrfsbase32(__V);
- }
- static __inline__ void __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
- _writefsbase_u64(unsigned long long __V)
- {
- return __builtin_ia32_wrfsbase64(__V);
- }
- static __inline__ void __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
- _writegsbase_u32(unsigned int __V)
- {
- return __builtin_ia32_wrgsbase32(__V);
- }
- static __inline__ void __attribute__((__always_inline__, __nodebug__, __target__("fsgsbase")))
- _writegsbase_u64(unsigned long long __V)
- {
- return __builtin_ia32_wrgsbase64(__V);
- }
- #endif
- #endif /* __FSGSBASE__ */
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__RTM__)
- #include <rtmintrin.h>
- #include <xtestintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__SHA__)
- #include <shaintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__FXSR__)
- #include <fxsrintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__XSAVE__)
- #include <xsaveintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__XSAVEOPT__)
- #include <xsaveoptintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__XSAVEC__)
- #include <xsavecintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__XSAVES__)
- #include <xsavesintrin.h>
- #endif
- #if !defined(_MSC_VER) || __has_feature(modules) || defined(__SHSTK__)
- #include <cetintrin.h>
- #endif
- /* Some intrinsics inside adxintrin.h are available only on processors with ADX,
- * whereas others are also available at all times. */
- #include <adxintrin.h>
- #endif /* __IMMINTRIN_H */
|