avx512vbmiintrin.h 4.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137
  1. /*===------------- avx512vbmiintrin.h - VBMI intrinsics ------------------===
  2. *
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a copy
  5. * of this software and associated documentation files (the "Software"), to deal
  6. * in the Software without restriction, including without limitation the rights
  7. * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  8. * copies of the Software, and to permit persons to whom the Software is
  9. * furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice shall be included in
  12. * all copies or substantial portions of the Software.
  13. *
  14. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  17. * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  18. * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  19. * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
  20. * THE SOFTWARE.
  21. *
  22. *===-----------------------------------------------------------------------===
  23. */
  24. #ifndef __IMMINTRIN_H
  25. #error "Never use <avx512vbmiintrin.h> directly; include <immintrin.h> instead."
  26. #endif
  27. #ifndef __VBMIINTRIN_H
  28. #define __VBMIINTRIN_H
  29. /* Define the default attributes for the functions in this file. */
  30. #define __DEFAULT_FN_ATTRS __attribute__((__always_inline__, __nodebug__, __target__("avx512vbmi")))
  31. static __inline__ __m512i __DEFAULT_FN_ATTRS
  32. _mm512_mask2_permutex2var_epi8 (__m512i __A, __m512i __I,
  33. __mmask64 __U, __m512i __B)
  34. {
  35. return (__m512i) __builtin_ia32_vpermi2varqi512_mask ((__v64qi) __A,
  36. (__v64qi) __I
  37. /* idx */ ,
  38. (__v64qi) __B,
  39. (__mmask64) __U);
  40. }
  41. static __inline__ __m512i __DEFAULT_FN_ATTRS
  42. _mm512_permutex2var_epi8 (__m512i __A, __m512i __I, __m512i __B)
  43. {
  44. return (__m512i) __builtin_ia32_vpermt2varqi512_mask ((__v64qi) __I
  45. /* idx */ ,
  46. (__v64qi) __A,
  47. (__v64qi) __B,
  48. (__mmask64) -1);
  49. }
  50. static __inline__ __m512i __DEFAULT_FN_ATTRS
  51. _mm512_mask_permutex2var_epi8 (__m512i __A, __mmask64 __U,
  52. __m512i __I, __m512i __B)
  53. {
  54. return (__m512i) __builtin_ia32_vpermt2varqi512_mask ((__v64qi) __I
  55. /* idx */ ,
  56. (__v64qi) __A,
  57. (__v64qi) __B,
  58. (__mmask64) __U);
  59. }
  60. static __inline__ __m512i __DEFAULT_FN_ATTRS
  61. _mm512_maskz_permutex2var_epi8 (__mmask64 __U, __m512i __A,
  62. __m512i __I, __m512i __B)
  63. {
  64. return (__m512i) __builtin_ia32_vpermt2varqi512_maskz ((__v64qi) __I
  65. /* idx */ ,
  66. (__v64qi) __A,
  67. (__v64qi) __B,
  68. (__mmask64) __U);
  69. }
  70. static __inline__ __m512i __DEFAULT_FN_ATTRS
  71. _mm512_permutexvar_epi8 (__m512i __A, __m512i __B)
  72. {
  73. return (__m512i) __builtin_ia32_permvarqi512_mask ((__v64qi) __B,
  74. (__v64qi) __A,
  75. (__v64qi) _mm512_undefined_epi32 (),
  76. (__mmask64) -1);
  77. }
  78. static __inline__ __m512i __DEFAULT_FN_ATTRS
  79. _mm512_maskz_permutexvar_epi8 (__mmask64 __M, __m512i __A,
  80. __m512i __B)
  81. {
  82. return (__m512i) __builtin_ia32_permvarqi512_mask ((__v64qi) __B,
  83. (__v64qi) __A,
  84. (__v64qi) _mm512_setzero_si512(),
  85. (__mmask64) __M);
  86. }
  87. static __inline__ __m512i __DEFAULT_FN_ATTRS
  88. _mm512_mask_permutexvar_epi8 (__m512i __W, __mmask64 __M, __m512i __A,
  89. __m512i __B)
  90. {
  91. return (__m512i) __builtin_ia32_permvarqi512_mask ((__v64qi) __B,
  92. (__v64qi) __A,
  93. (__v64qi) __W,
  94. (__mmask64) __M);
  95. }
  96. static __inline__ __m512i __DEFAULT_FN_ATTRS
  97. _mm512_mask_multishift_epi64_epi8 (__m512i __W, __mmask64 __M, __m512i __X, __m512i __Y)
  98. {
  99. return (__m512i) __builtin_ia32_vpmultishiftqb512_mask ((__v64qi) __X,
  100. (__v64qi) __Y,
  101. (__v64qi) __W,
  102. (__mmask64) __M);
  103. }
  104. static __inline__ __m512i __DEFAULT_FN_ATTRS
  105. _mm512_maskz_multishift_epi64_epi8 (__mmask64 __M, __m512i __X, __m512i __Y)
  106. {
  107. return (__m512i) __builtin_ia32_vpmultishiftqb512_mask ((__v64qi) __X,
  108. (__v64qi) __Y,
  109. (__v64qi) _mm512_setzero_si512 (),
  110. (__mmask64) __M);
  111. }
  112. static __inline__ __m512i __DEFAULT_FN_ATTRS
  113. _mm512_multishift_epi64_epi8 (__m512i __X, __m512i __Y)
  114. {
  115. return (__m512i) __builtin_ia32_vpmultishiftqb512_mask ((__v64qi) __X,
  116. (__v64qi) __Y,
  117. (__v64qi) _mm512_undefined_epi32 (),
  118. (__mmask64) -1);
  119. }
  /* The attribute macro is private to this header; undefine it so it does
   * not leak into code that includes this file. */
  #undef __DEFAULT_FN_ATTRS
  #endif /* __VBMIINTRIN_H */