25 #error "Never use <avx512bwintrin.h> directly; include <immintrin.h> instead." 28 #ifndef __AVX512BWINTRIN_H 29 #define __AVX512BWINTRIN_H 35 #define __DEFAULT_FN_ATTRS512 __attribute__((__always_inline__, __nodebug__, __target__("avx512bw"), __min_vector_width__(512))) 36 #define __DEFAULT_FN_ATTRS __attribute__((__always_inline__, __nodebug__, __target__("avx512bw"))) 41 return __builtin_ia32_knotsi(__M);
47 return __builtin_ia32_knotdi(__M);
113 return (
unsigned char)__builtin_ia32_kortestcsi(__A, __B);
119 return (
unsigned char)__builtin_ia32_kortestzsi(__A, __B);
124 *__C = (
unsigned char)__builtin_ia32_kortestcsi(__A, __B);
125 return (
unsigned char)__builtin_ia32_kortestzsi(__A, __B);
131 return (
unsigned char)__builtin_ia32_kortestcdi(__A, __B);
137 return (
unsigned char)__builtin_ia32_kortestzdi(__A, __B);
142 *__C = (
unsigned char)__builtin_ia32_kortestcdi(__A, __B);
143 return (
unsigned char)__builtin_ia32_kortestzdi(__A, __B);
149 return (
unsigned char)__builtin_ia32_ktestcsi(__A, __B);
155 return (
unsigned char)__builtin_ia32_ktestzsi(__A, __B);
160 *__C = (
unsigned char)__builtin_ia32_ktestcsi(__A, __B);
161 return (
unsigned char)__builtin_ia32_ktestzsi(__A, __B);
167 return (
unsigned char)__builtin_ia32_ktestcdi(__A, __B);
173 return (
unsigned char)__builtin_ia32_ktestzdi(__A, __B);
178 *__C = (
unsigned char)__builtin_ia32_ktestcdi(__A, __B);
179 return (
unsigned char)__builtin_ia32_ktestzdi(__A, __B);
194 #define _kshiftli_mask32(A, I) \ 195 (__mmask32)__builtin_ia32_kshiftlisi((__mmask32)(A), (unsigned int)(I)) 197 #define _kshiftri_mask32(A, I) \ 198 (__mmask32)__builtin_ia32_kshiftrisi((__mmask32)(A), (unsigned int)(I)) 200 #define _kshiftli_mask64(A, I) \ 201 (__mmask64)__builtin_ia32_kshiftlidi((__mmask64)(A), (unsigned int)(I)) 203 #define _kshiftri_mask64(A, I) \ 204 (__mmask64)__builtin_ia32_kshiftridi((__mmask64)(A), (unsigned int)(I)) 208 return (
unsigned int)__builtin_ia32_kmovd((
__mmask32)__A);
213 return (
unsigned long long)__builtin_ia32_kmovq((
__mmask64)__A);
248 #define _mm512_cmp_epi8_mask(a, b, p) \ 249 (__mmask64)__builtin_ia32_cmpb512_mask((__v64qi)(__m512i)(a), \ 250 (__v64qi)(__m512i)(b), (int)(p), \ 253 #define _mm512_mask_cmp_epi8_mask(m, a, b, p) \ 254 (__mmask64)__builtin_ia32_cmpb512_mask((__v64qi)(__m512i)(a), \ 255 (__v64qi)(__m512i)(b), (int)(p), \ 258 #define _mm512_cmp_epu8_mask(a, b, p) \ 259 (__mmask64)__builtin_ia32_ucmpb512_mask((__v64qi)(__m512i)(a), \ 260 (__v64qi)(__m512i)(b), (int)(p), \ 263 #define _mm512_mask_cmp_epu8_mask(m, a, b, p) \ 264 (__mmask64)__builtin_ia32_ucmpb512_mask((__v64qi)(__m512i)(a), \ 265 (__v64qi)(__m512i)(b), (int)(p), \ 268 #define _mm512_cmp_epi16_mask(a, b, p) \ 269 (__mmask32)__builtin_ia32_cmpw512_mask((__v32hi)(__m512i)(a), \ 270 (__v32hi)(__m512i)(b), (int)(p), \ 273 #define _mm512_mask_cmp_epi16_mask(m, a, b, p) \ 274 (__mmask32)__builtin_ia32_cmpw512_mask((__v32hi)(__m512i)(a), \ 275 (__v32hi)(__m512i)(b), (int)(p), \ 278 #define _mm512_cmp_epu16_mask(a, b, p) \ 279 (__mmask32)__builtin_ia32_ucmpw512_mask((__v32hi)(__m512i)(a), \ 280 (__v32hi)(__m512i)(b), (int)(p), \ 283 #define _mm512_mask_cmp_epu16_mask(m, a, b, p) \ 284 (__mmask32)__builtin_ia32_ucmpw512_mask((__v32hi)(__m512i)(a), \ 285 (__v32hi)(__m512i)(b), (int)(p), \ 288 #define _mm512_cmpeq_epi8_mask(A, B) \ 289 _mm512_cmp_epi8_mask((A), (B), _MM_CMPINT_EQ) 290 #define _mm512_mask_cmpeq_epi8_mask(k, A, B) \ 291 _mm512_mask_cmp_epi8_mask((k), (A), (B), _MM_CMPINT_EQ) 292 #define _mm512_cmpge_epi8_mask(A, B) \ 293 _mm512_cmp_epi8_mask((A), (B), _MM_CMPINT_GE) 294 #define _mm512_mask_cmpge_epi8_mask(k, A, B) \ 295 _mm512_mask_cmp_epi8_mask((k), (A), (B), _MM_CMPINT_GE) 296 #define _mm512_cmpgt_epi8_mask(A, B) \ 297 _mm512_cmp_epi8_mask((A), (B), _MM_CMPINT_GT) 298 #define _mm512_mask_cmpgt_epi8_mask(k, A, B) \ 299 _mm512_mask_cmp_epi8_mask((k), (A), (B), _MM_CMPINT_GT) 300 #define _mm512_cmple_epi8_mask(A, B) \ 301 _mm512_cmp_epi8_mask((A), (B), _MM_CMPINT_LE) 302 #define _mm512_mask_cmple_epi8_mask(k, A, B) \ 303 _mm512_mask_cmp_epi8_mask((k), (A), (B), _MM_CMPINT_LE) 304 #define _mm512_cmplt_epi8_mask(A, B) \ 305 _mm512_cmp_epi8_mask((A), (B), _MM_CMPINT_LT) 306 #define _mm512_mask_cmplt_epi8_mask(k, A, B) \ 307 _mm512_mask_cmp_epi8_mask((k), (A), (B), _MM_CMPINT_LT) 308 #define _mm512_cmpneq_epi8_mask(A, B) \ 309 _mm512_cmp_epi8_mask((A), (B), _MM_CMPINT_NE) 310 #define _mm512_mask_cmpneq_epi8_mask(k, A, B) \ 311 _mm512_mask_cmp_epi8_mask((k), (A), (B), _MM_CMPINT_NE) 313 #define _mm512_cmpeq_epu8_mask(A, B) \ 314 _mm512_cmp_epu8_mask((A), (B), _MM_CMPINT_EQ) 315 #define _mm512_mask_cmpeq_epu8_mask(k, A, B) \ 316 _mm512_mask_cmp_epu8_mask((k), (A), (B), _MM_CMPINT_EQ) 317 #define _mm512_cmpge_epu8_mask(A, B) \ 318 _mm512_cmp_epu8_mask((A), (B), _MM_CMPINT_GE) 319 #define _mm512_mask_cmpge_epu8_mask(k, A, B) \ 320 _mm512_mask_cmp_epu8_mask((k), (A), (B), _MM_CMPINT_GE) 321 #define _mm512_cmpgt_epu8_mask(A, B) \ 322 _mm512_cmp_epu8_mask((A), (B), _MM_CMPINT_GT) 323 #define _mm512_mask_cmpgt_epu8_mask(k, A, B) \ 324 _mm512_mask_cmp_epu8_mask((k), (A), (B), _MM_CMPINT_GT) 325 #define _mm512_cmple_epu8_mask(A, B) \ 326 _mm512_cmp_epu8_mask((A), (B), _MM_CMPINT_LE) 327 #define _mm512_mask_cmple_epu8_mask(k, A, B) \ 328 _mm512_mask_cmp_epu8_mask((k), (A), (B), _MM_CMPINT_LE) 329 #define _mm512_cmplt_epu8_mask(A, B) \ 330 _mm512_cmp_epu8_mask((A), (B), _MM_CMPINT_LT) 331 #define _mm512_mask_cmplt_epu8_mask(k, A, B) \ 332 _mm512_mask_cmp_epu8_mask((k), (A), (B), _MM_CMPINT_LT) 333 #define _mm512_cmpneq_epu8_mask(A, B) \ 334 _mm512_cmp_epu8_mask((A), (B), _MM_CMPINT_NE) 335 #define _mm512_mask_cmpneq_epu8_mask(k, A, B) \ 336 _mm512_mask_cmp_epu8_mask((k), (A), (B), _MM_CMPINT_NE) 338 #define _mm512_cmpeq_epi16_mask(A, B) \ 339 _mm512_cmp_epi16_mask((A), (B), _MM_CMPINT_EQ) 340 #define _mm512_mask_cmpeq_epi16_mask(k, A, B) \ 341 _mm512_mask_cmp_epi16_mask((k), (A), (B), _MM_CMPINT_EQ) 342 #define _mm512_cmpge_epi16_mask(A, B) \ 343 _mm512_cmp_epi16_mask((A), (B), _MM_CMPINT_GE) 344 #define _mm512_mask_cmpge_epi16_mask(k, A, B) \ 345 _mm512_mask_cmp_epi16_mask((k), (A), (B), _MM_CMPINT_GE) 346 #define _mm512_cmpgt_epi16_mask(A, B) \ 347 _mm512_cmp_epi16_mask((A), (B), _MM_CMPINT_GT) 348 #define _mm512_mask_cmpgt_epi16_mask(k, A, B) \ 349 _mm512_mask_cmp_epi16_mask((k), (A), (B), _MM_CMPINT_GT) 350 #define _mm512_cmple_epi16_mask(A, B) \ 351 _mm512_cmp_epi16_mask((A), (B), _MM_CMPINT_LE) 352 #define _mm512_mask_cmple_epi16_mask(k, A, B) \ 353 _mm512_mask_cmp_epi16_mask((k), (A), (B), _MM_CMPINT_LE) 354 #define _mm512_cmplt_epi16_mask(A, B) \ 355 _mm512_cmp_epi16_mask((A), (B), _MM_CMPINT_LT) 356 #define _mm512_mask_cmplt_epi16_mask(k, A, B) \ 357 _mm512_mask_cmp_epi16_mask((k), (A), (B), _MM_CMPINT_LT) 358 #define _mm512_cmpneq_epi16_mask(A, B) \ 359 _mm512_cmp_epi16_mask((A), (B), _MM_CMPINT_NE) 360 #define _mm512_mask_cmpneq_epi16_mask(k, A, B) \ 361 _mm512_mask_cmp_epi16_mask((k), (A), (B), _MM_CMPINT_NE) 363 #define _mm512_cmpeq_epu16_mask(A, B) \ 364 _mm512_cmp_epu16_mask((A), (B), _MM_CMPINT_EQ) 365 #define _mm512_mask_cmpeq_epu16_mask(k, A, B) \ 366 _mm512_mask_cmp_epu16_mask((k), (A), (B), _MM_CMPINT_EQ) 367 #define _mm512_cmpge_epu16_mask(A, B) \ 368 _mm512_cmp_epu16_mask((A), (B), _MM_CMPINT_GE) 369 #define _mm512_mask_cmpge_epu16_mask(k, A, B) \ 370 _mm512_mask_cmp_epu16_mask((k), (A), (B), _MM_CMPINT_GE) 371 #define _mm512_cmpgt_epu16_mask(A, B) \ 372 _mm512_cmp_epu16_mask((A), (B), _MM_CMPINT_GT) 373 #define _mm512_mask_cmpgt_epu16_mask(k, A, B) \ 374 _mm512_mask_cmp_epu16_mask((k), (A), (B), _MM_CMPINT_GT) 375 #define _mm512_cmple_epu16_mask(A, B) \ 376 _mm512_cmp_epu16_mask((A), (B), _MM_CMPINT_LE) 377 #define _mm512_mask_cmple_epu16_mask(k, A, B) \ 378 _mm512_mask_cmp_epu16_mask((k), (A), (B), _MM_CMPINT_LE) 379 #define _mm512_cmplt_epu16_mask(A, B) \ 380 _mm512_cmp_epu16_mask((A), (B), _MM_CMPINT_LT) 381 #define _mm512_mask_cmplt_epu16_mask(k, A, B) \ 382 _mm512_mask_cmp_epu16_mask((k), (A), (B), _MM_CMPINT_LT) 383 #define _mm512_cmpneq_epu16_mask(A, B) \ 384 _mm512_cmp_epu16_mask((A), (B), _MM_CMPINT_NE) 385 #define _mm512_mask_cmpneq_epu16_mask(k, A, B) \ 386 _mm512_mask_cmp_epu16_mask((k), (A), (B), _MM_CMPINT_NE) 390 return (__m512i) ((__v64qu) __A + (__v64qu) __B);
395 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
402 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
409 return (__m512i) ((__v64qu) __A - (__v64qu) __B);
414 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
421 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
428 return (__m512i) ((__v32hu) __A + (__v32hu) __B);
433 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
440 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
447 return (__m512i) ((__v32hu) __A - (__v32hu) __B);
452 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
459 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
466 return (__m512i) ((__v32hu) __A * (__v32hu) __B);
471 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
478 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
486 return (__m512i) __builtin_ia32_selectb_512 ((
__mmask64) __U,
494 return (__m512i) __builtin_ia32_selectw_512 ((
__mmask32) __U,
502 return (__m512i)__builtin_ia32_pabsb512((__v64qi)__A);
508 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
516 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
524 return (__m512i)__builtin_ia32_pabsw512((__v32hi)__A);
530 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
538 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
546 return (__m512i)__builtin_ia32_packssdw512((__v16si)__A, (__v16si)__B);
552 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
560 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
568 return (__m512i)__builtin_ia32_packsswb512((__v32hi)__A, (__v32hi) __B);
574 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
582 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
590 return (__m512i)__builtin_ia32_packusdw512((__v16si) __A, (__v16si) __B);
596 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
604 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
612 return (__m512i)__builtin_ia32_packuswb512((__v32hi) __A, (__v32hi) __B);
618 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
626 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
634 return (__m512i)__builtin_ia32_paddsb512((__v64qi)__A, (__v64qi)__B);
640 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
648 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
656 return (__m512i)__builtin_ia32_paddsw512((__v32hi)__A, (__v32hi)__B);
662 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
670 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
678 return (__m512i)__builtin_ia32_paddusb512((__v64qi) __A, (__v64qi) __B);
684 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
692 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
700 return (__m512i)__builtin_ia32_paddusw512((__v32hi) __A, (__v32hi) __B);
706 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
714 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
722 typedef unsigned short __v64hu
__attribute__((__vector_size__(128)));
723 return (__m512i)__builtin_convertvector(
724 ((__builtin_convertvector((__v64qu) __A, __v64hu) +
725 __builtin_convertvector((__v64qu) __B, __v64hu)) + 1)
733 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
741 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
749 typedef unsigned int __v32su
__attribute__((__vector_size__(128)));
750 return (__m512i)__builtin_convertvector(
751 ((__builtin_convertvector((__v32hu) __A, __v32su) +
752 __builtin_convertvector((__v32hu) __B, __v32su)) + 1)
760 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
768 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
776 return (__m512i)__builtin_ia32_pmaxsb512((__v64qi) __A, (__v64qi) __B);
782 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
790 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
798 return (__m512i)__builtin_ia32_pmaxsw512((__v32hi) __A, (__v32hi) __B);
804 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
813 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
821 return (__m512i)__builtin_ia32_pmaxub512((__v64qi)__A, (__v64qi)__B);
827 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
835 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
843 return (__m512i)__builtin_ia32_pmaxuw512((__v32hi)__A, (__v32hi)__B);
849 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
857 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
865 return (__m512i)__builtin_ia32_pminsb512((__v64qi) __A, (__v64qi) __B);
871 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
879 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
887 return (__m512i)__builtin_ia32_pminsw512((__v32hi) __A, (__v32hi) __B);
893 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
901 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
909 return (__m512i)__builtin_ia32_pminub512((__v64qi)__A, (__v64qi)__B);
915 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
923 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
931 return (__m512i)__builtin_ia32_pminuw512((__v32hi)__A, (__v32hi)__B);
937 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
945 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
953 return (__m512i)__builtin_ia32_pshufb512((__v64qi)__A,(__v64qi)__B);
959 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
967 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
975 return (__m512i)__builtin_ia32_psubsb512((__v64qi)__A, (__v64qi)__B);
981 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
989 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
997 return (__m512i)__builtin_ia32_psubsw512((__v32hi)__A, (__v32hi)__B);
1003 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1011 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1019 return (__m512i)__builtin_ia32_psubusb512((__v64qi) __A, (__v64qi) __B);
1025 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
1033 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
1041 return (__m512i)__builtin_ia32_psubusw512((__v32hi) __A, (__v32hi) __B);
1047 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1055 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1063 return (__m512i)__builtin_ia32_vpermi2varhi512((__v32hi)__A, (__v32hi)__I,
1071 return (__m512i)__builtin_ia32_selectw_512(__U,
1080 return (__m512i)__builtin_ia32_selectw_512(__U,
1089 return (__m512i)__builtin_ia32_selectw_512(__U,
1097 return (__m512i)__builtin_ia32_pmulhrsw512((__v32hi)__A, (__v32hi)__B);
1103 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1111 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1119 return (__m512i)__builtin_ia32_pmulhw512((__v32hi) __A, (__v32hi) __B);
1126 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1134 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1142 return (__m512i)__builtin_ia32_pmulhuw512((__v32hi) __A, (__v32hi) __B);
1148 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1156 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1163 return (__m512i)__builtin_ia32_pmaddubsw512((__v64qi)__X, (__v64qi)__Y);
1169 return (__m512i)__builtin_ia32_selectw_512((
__mmask32) __U,
1176 return (__m512i)__builtin_ia32_selectw_512((
__mmask32) __U,
1183 return (__m512i)__builtin_ia32_pmaddwd512((__v32hi)__A, (__v32hi)__B);
1188 return (__m512i)__builtin_ia32_selectd_512((
__mmask16)__U,
1195 return (__m512i)__builtin_ia32_selectd_512((
__mmask16)__U,
1202 return (__m256i) __builtin_ia32_pmovswb512_mask ((__v32hi) __A,
1209 return (__m256i) __builtin_ia32_pmovswb512_mask ((__v32hi) __A,
1216 return (__m256i) __builtin_ia32_pmovswb512_mask ((__v32hi) __A,
1223 return (__m256i) __builtin_ia32_pmovuswb512_mask ((__v32hi) __A,
1230 return (__m256i) __builtin_ia32_pmovuswb512_mask ((__v32hi) __A,
1237 return (__m256i) __builtin_ia32_pmovuswb512_mask ((__v32hi) __A,
1244 return (__m256i) __builtin_ia32_pmovwb512_mask ((__v32hi) __A,
1251 return (__m256i) __builtin_ia32_pmovwb512_mask ((__v32hi) __A,
1258 return (__m256i) __builtin_ia32_pmovwb512_mask ((__v32hi) __A,
1266 __builtin_ia32_pmovwb512mem_mask ((__v32qi *) __P, (__v32hi) __A, __M);
1272 __builtin_ia32_pmovswb512mem_mask ((__v32qi *) __P, (__v32hi) __A, __M);
1278 __builtin_ia32_pmovuswb512mem_mask ((__v32qi *) __P, (__v32hi) __A, __M);
1283 return (__m512i)__builtin_shufflevector((__v64qi)__A, (__v64qi)__B,
1285 10, 64+10, 11, 64+11,
1286 12, 64+12, 13, 64+13,
1287 14, 64+14, 15, 64+15,
1288 24, 64+24, 25, 64+25,
1289 26, 64+26, 27, 64+27,
1290 28, 64+28, 29, 64+29,
1291 30, 64+30, 31, 64+31,
1292 40, 64+40, 41, 64+41,
1293 42, 64+42, 43, 64+43,
1294 44, 64+44, 45, 64+45,
1295 46, 64+46, 47, 64+47,
1296 56, 64+56, 57, 64+57,
1297 58, 64+58, 59, 64+59,
1298 60, 64+60, 61, 64+61,
1299 62, 64+62, 63, 64+63);
1304 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
1311 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
1318 return (__m512i)__builtin_shufflevector((__v32hi)__A, (__v32hi)__B,
1321 12, 32+12, 13, 32+13,
1322 14, 32+14, 15, 32+15,
1323 20, 32+20, 21, 32+21,
1324 22, 32+22, 23, 32+23,
1325 28, 32+28, 29, 32+29,
1326 30, 32+30, 31, 32+31);
1331 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1338 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1345 return (__m512i)__builtin_shufflevector((__v64qi)__A, (__v64qi)__B,
1350 16, 64+16, 17, 64+17,
1351 18, 64+18, 19, 64+19,
1352 20, 64+20, 21, 64+21,
1353 22, 64+22, 23, 64+23,
1354 32, 64+32, 33, 64+33,
1355 34, 64+34, 35, 64+35,
1356 36, 64+36, 37, 64+37,
1357 38, 64+38, 39, 64+39,
1358 48, 64+48, 49, 64+49,
1359 50, 64+50, 51, 64+51,
1360 52, 64+52, 53, 64+53,
1361 54, 64+54, 55, 64+55);
1366 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
1373 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
1380 return (__m512i)__builtin_shufflevector((__v32hi)__A, (__v32hi)__B,
1384 10, 32+10, 11, 32+11,
1385 16, 32+16, 17, 32+17,
1386 18, 32+18, 19, 32+19,
1387 24, 32+24, 25, 32+25,
1388 26, 32+26, 27, 32+27);
1393 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1400 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1410 return (__m512i)__builtin_convertvector((__v32qs)__A, __v32hi);
1416 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1424 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1432 return (__m512i)__builtin_convertvector((__v32qu)__A, __v32hi);
1438 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1446 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1452 #define _mm512_shufflehi_epi16(A, imm) \ 1453 (__m512i)__builtin_ia32_pshufhw512((__v32hi)(__m512i)(A), (int)(imm)) 1455 #define _mm512_mask_shufflehi_epi16(W, U, A, imm) \ 1456 (__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \ 1457 (__v32hi)_mm512_shufflehi_epi16((A), \ 1459 (__v32hi)(__m512i)(W)) 1461 #define _mm512_maskz_shufflehi_epi16(U, A, imm) \ 1462 (__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \ 1463 (__v32hi)_mm512_shufflehi_epi16((A), \ 1465 (__v32hi)_mm512_setzero_si512()) 1467 #define _mm512_shufflelo_epi16(A, imm) \ 1468 (__m512i)__builtin_ia32_pshuflw512((__v32hi)(__m512i)(A), (int)(imm)) 1471 #define _mm512_mask_shufflelo_epi16(W, U, A, imm) \ 1472 (__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \ 1473 (__v32hi)_mm512_shufflelo_epi16((A), \ 1475 (__v32hi)(__m512i)(W)) 1478 #define _mm512_maskz_shufflelo_epi16(U, A, imm) \ 1479 (__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \ 1480 (__v32hi)_mm512_shufflelo_epi16((A), \ 1482 (__v32hi)_mm512_setzero_si512()) 1487 return (__m512i)__builtin_ia32_psllv32hi((__v32hi) __A, (__v32hi) __B);
1493 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1501 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1509 return (__m512i)__builtin_ia32_psllw512((__v32hi) __A, (__v8hi) __B);
1515 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1523 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1531 return (__m512i)__builtin_ia32_psllwi512((__v32hi)__A, __B);
1537 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1545 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1550 #define _mm512_bslli_epi128(a, imm) \ 1551 (__m512i)__builtin_ia32_pslldqi512_byteshift((__v8di)(__m512i)(a), (int)(imm)) 1556 return (__m512i)__builtin_ia32_psrlv32hi((__v32hi)__A, (__v32hi)__B);
1562 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1570 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1578 return (__m512i)__builtin_ia32_psrav32hi((__v32hi)__A, (__v32hi)__B);
1584 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1592 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1600 return (__m512i)__builtin_ia32_psraw512((__v32hi) __A, (__v8hi) __B);
1606 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1614 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1622 return (__m512i)__builtin_ia32_psrawi512((__v32hi)__A, __B);
1628 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1636 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1644 return (__m512i)__builtin_ia32_psrlw512((__v32hi) __A, (__v8hi) __B);
1650 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1658 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1666 return (__m512i)__builtin_ia32_psrlwi512((__v32hi)__A, __B);
1672 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1680 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1685 #define _mm512_bsrli_epi128(a, imm) \ 1686 (__m512i)__builtin_ia32_psrldqi512_byteshift((__v8di)(__m512i)(a), (int)(imm)) 1691 return (__m512i) __builtin_ia32_selectw_512 ((
__mmask32) __U,
1699 return (__m512i) __builtin_ia32_selectw_512 ((
__mmask32) __U,
1707 return (__m512i) __builtin_ia32_selectb_512 ((
__mmask64) __U,
1715 return (__m512i) __builtin_ia32_selectb_512 ((
__mmask64) __U,
1723 return (__m512i) __builtin_ia32_selectb_512(__M,
1731 return (__m512i) __builtin_ia32_selectb_512(__M,
1753 struct __loadu_epi16 {
1756 return ((
struct __loadu_epi16*)__P)->__v;
1762 return (__m512i) __builtin_ia32_loaddquhi512_mask ((__v32hi *) __P,
1770 return (__m512i) __builtin_ia32_loaddquhi512_mask ((__v32hi *) __P,
1779 struct __loadu_epi8 {
1782 return ((
struct __loadu_epi8*)__P)->__v;
1788 return (__m512i) __builtin_ia32_loaddquqi512_mask ((__v64qi *) __P,
1796 return (__m512i) __builtin_ia32_loaddquqi512_mask ((__v64qi *) __P,
1805 struct __storeu_epi16 {
1808 ((
struct __storeu_epi16*)__P)->__v = __A;
1814 __builtin_ia32_storedquhi512_mask ((__v32hi *) __P,
1822 struct __storeu_epi8 {
1825 ((
struct __storeu_epi8*)__P)->__v = __A;
1831 __builtin_ia32_storedquqi512_mask ((__v64qi *) __P,
1894 return (
__mmask64) __builtin_ia32_cvtb2mask512 ((__v64qi) __A);
1900 return (
__mmask32) __builtin_ia32_cvtw2mask512 ((__v32hi) __A);
1906 return (__m512i) __builtin_ia32_cvtmask2b512 (__A);
1912 return (__m512i) __builtin_ia32_cvtmask2w512 (__A);
1918 return (__m512i)__builtin_shufflevector((__v16qi) __A, (__v16qi) __A,
1919 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1920 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1921 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1922 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0);
1928 return (__m512i)__builtin_ia32_selectb_512(__M,
1936 return (__m512i)__builtin_ia32_selectb_512(__M,
1944 return (__m512i) __builtin_ia32_selectw_512(__M,
1952 return (__m512i) __builtin_ia32_selectw_512(__M,
1960 return (__m512i)__builtin_shufflevector((__v8hi) __A, (__v8hi) __A,
1961 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1962 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0);
1968 return (__m512i)__builtin_ia32_selectw_512(__M,
1976 return (__m512i)__builtin_ia32_selectw_512(__M,
1984 return (__m512i)__builtin_ia32_permvarhi512((__v32hi)__B, (__v32hi)__A);
1991 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
2000 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
2005 #define _mm512_alignr_epi8(A, B, N) \ 2006 (__m512i)__builtin_ia32_palignr512((__v64qi)(__m512i)(A), \ 2007 (__v64qi)(__m512i)(B), (int)(N)) 2009 #define _mm512_mask_alignr_epi8(W, U, A, B, N) \ 2010 (__m512i)__builtin_ia32_selectb_512((__mmask64)(U), \ 2011 (__v64qi)_mm512_alignr_epi8((A), (B), (int)(N)), \ 2012 (__v64qi)(__m512i)(W)) 2014 #define _mm512_maskz_alignr_epi8(U, A, B, N) \ 2015 (__m512i)__builtin_ia32_selectb_512((__mmask64)(U), \ 2016 (__v64qi)_mm512_alignr_epi8((A), (B), (int)(N)), \ 2017 (__v64qi)(__m512i)_mm512_setzero_si512()) 2019 #define _mm512_dbsad_epu8(A, B, imm) \ 2020 (__m512i)__builtin_ia32_dbpsadbw512((__v64qi)(__m512i)(A), \ 2021 (__v64qi)(__m512i)(B), (int)(imm)) 2023 #define _mm512_mask_dbsad_epu8(W, U, A, B, imm) \ 2024 (__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \ 2025 (__v32hi)_mm512_dbsad_epu8((A), (B), (imm)), \ 2026 (__v32hi)(__m512i)(W)) 2028 #define _mm512_maskz_dbsad_epu8(U, A, B, imm) \ 2029 (__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \ 2030 (__v32hi)_mm512_dbsad_epu8((A), (B), (imm)), \ 2031 (__v32hi)_mm512_setzero_si512()) 2036 return (__m512i) __builtin_ia32_psadbw512 ((__v64qi) __A,
2040 #undef __DEFAULT_FN_ATTRS512 2041 #undef __DEFAULT_FN_ATTRS static __inline__ __mmask64 __DEFAULT_FN_ATTRS512 _mm512_mask_testn_epi8_mask(__mmask64 __U, __m512i __A, __m512i __B)
#define _mm512_cmpeq_epi16_mask(A, B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_adds_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_min_epi8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_unpackhi_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_max_epu8(__m512i __W, __mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_subs_epu16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_sad_epu8(__m512i __A, __m512i __B)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS _kxnor_mask32(__mmask32 __A, __mmask32 __B)
static __inline __m512i __DEFAULT_FN_ATTRS512 _mm512_loadu_epi8(void const *__P)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_mullo_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_mulhi_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_avg_epu16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_mulhi_epu16(__mmask32 __U, __m512i __A, __m512i __B)
struct __storeu_i16 *__P __v
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_unpacklo_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS _kand_mask64(__mmask64 __A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_avg_epu16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline void __DEFAULT_FN_ATTRS512 _mm512_storeu_epi16(void *__P, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_unpackhi_epi8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_slli_epi16(__mmask32 __U, __m512i __A, int __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS _kadd_mask64(__mmask64 __A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_unpackhi_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS512 _mm512_kunpackd(__mmask64 __A, __mmask64 __B)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS _load_mask32(__mmask32 *__A)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS512 _mm512_mask_test_epi16_mask(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ void __DEFAULT_FN_ATTRS _store_mask64(__mmask64 *__A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_packus_epi16(__m512i __A, __m512i __B)
vector signed char unaligned_vec_schar __attribute__((aligned(1)))
Zeroes the upper 128 bits (bits 255:128) of all YMM registers.
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_srai_epi16(__m512i __W, __mmask32 __U, __m512i __A, int __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_sub_epi8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_packs_epi32(__mmask32 __M, __m512i __A, __m512i __B)
#define _mm512_mask_cmpneq_epi8_mask(k, A, B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_sllv_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_cvtepu8_epi16(__mmask32 __U, __m256i __A)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS _kand_mask32(__mmask32 __A, __mmask32 __B)
#define _mm512_mask_cmpneq_epi16_mask(k, A, B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_sllv_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_subs_epu8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_srlv_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_sub_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_subs_epi8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_add_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_srl_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m128i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_sub_epi8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_permutex2var_epi16(__m512i __A, __m512i __I, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_abs_epi16(__m512i __W, __mmask32 __U, __m512i __A)
static __inline__ unsigned long long __DEFAULT_FN_ATTRS _cvtmask64_u64(__mmask64 __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_avg_epu8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_unpacklo_epi8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_mov_epi16(__mmask32 __U, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_adds_epi8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_cvtepi8_epi16(__m256i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_srai_epi16(__m512i __A, int __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS512 _mm512_test_epi8_mask(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_abs_epi16(__mmask32 __U, __m512i __A)
static __inline__ void __DEFAULT_FN_ATTRS _store_mask32(__mmask32 *__A, __mmask32 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_cvtepi8_epi16(__m512i __W, __mmask32 __U, __m256i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_shuffle_epi8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_and_epi32(__m512i __a, __m512i __b)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_subs_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_max_epi8(__m512i __W, __mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_adds_epu16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_add_epi8(__m512i __A, __m512i __B)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _kortestc_mask32_u8(__mmask32 __A, __mmask32 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_broadcastb_epi8(__m512i __O, __mmask64 __M, __m128i __A)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS _kadd_mask32(__mmask32 __A, __mmask32 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_set1_epi8(__m512i __O, __mmask64 __M, char __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_blend_epi8(__mmask64 __U, __m512i __A, __m512i __W)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_permutexvar_epi16(__mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_srli_epi16(__mmask32 __U, __m512i __A, int __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_broadcastb_epi8(__m128i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_avg_epu8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_unpackhi_epi8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_add_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_max_epu8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_unpacklo_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m256i __DEFAULT_FN_ATTRS512 _mm512_cvtusepi16_epi8(__m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_abs_epi16(__m512i __A)
static __inline__ void __DEFAULT_FN_ATTRS512 _mm512_mask_cvtusepi16_storeu_epi8(void *__P, __mmask32 __M, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_shuffle_epi8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_max_epi16(__mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_cvtepu8_epi16(__m256i __A)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS _cvtu64_mask64(unsigned long long __A)
static __inline__ __m256i __DEFAULT_FN_ATTRS _mm256_undefined_si256(void)
Create a 256-bit integer vector with undefined values.
static __inline__ __mmask32 __DEFAULT_FN_ATTRS _kxor_mask32(__mmask32 __A, __mmask32 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_max_epu16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_permutexvar_epi16(__m512i __A, __m512i __B)
static __inline__ __m256i __DEFAULT_FN_ATTRS512 _mm512_mask_cvtepi16_epi8(__m256i __O, __mmask32 __M, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_packs_epi16(__m512i __A, __m512i __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS512 _mm512_testn_epi8_mask(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_mov_epi8(__m512i __W, __mmask64 __U, __m512i __A)
static __inline __m512i __DEFAULT_FN_ATTRS512 _mm512_setzero_si512(void)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _ktestz_mask32_u8(__mmask32 __A, __mmask32 __B)
#define _mm512_cmpneq_epi16_mask(A, B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_min_epu8(__mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_min_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_set1_epi16(__m512i __O, __mmask32 __M, short __A)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _ktestc_mask32_u8(__mmask32 __A, __mmask32 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_subs_epu16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_mulhrs_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS512 _mm512_test_epi16_mask(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_sll_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m128i __B)
#define _mm512_cmpeq_epi8_mask(A, B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS _kxnor_mask64(__mmask64 __A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_mulhi_epu16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _kortest_mask32_u8(__mmask32 __A, __mmask32 __B, unsigned char *__C)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_subs_epi8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_min_epi8(__m512i __W, __mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_mulhi_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_adds_epu8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m256i __DEFAULT_FN_ATTRS512 _mm512_cvtsepi16_epi8(__m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_max_epi8(__m512i __A, __m512i __B)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _kortestz_mask64_u8(__mmask64 __A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_unpacklo_epi8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS _kandn_mask32(__mmask32 __A, __mmask32 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_broadcastw_epi16(__m128i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_add_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_packus_epi16(__mmask64 __M, __m512i __A, __m512i __B)
#define __DEFAULT_FN_ATTRS
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_sub_epi8(__m512i __A, __m512i __B)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _kortest_mask64_u8(__mmask64 __A, __mmask64 __B, unsigned char *__C)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_max_epu8(__mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_srav_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_srai_epi16(__mmask32 __U, __m512i __A, int __B)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS _kor_mask32(__mmask32 __A, __mmask32 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_unpackhi_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_max_epu16(__mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS512 _mm512_testn_epi16_mask(__m512i __A, __m512i __B)
unsigned long long __mmask64
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_sra_epi16(__mmask32 __U, __m512i __A, __m128i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_shuffle_epi8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_subs_epi8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline __mmask32 __DEFAULT_FN_ATTRS _knot_mask32(__mmask32 __M)
static __inline__ void __DEFAULT_FN_ATTRS512 _mm512_mask_cvtsepi16_storeu_epi8(void *__P, __mmask32 __M, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_abs_epi8(__m512i __A)
#define _mm512_cmpneq_epi8_mask(A, B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_packus_epi32(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_slli_epi16(__m512i __W, __mmask32 __U, __m512i __A, int __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_min_epu8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_broadcastw_epi16(__m512i __O, __mmask32 __M, __m128i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_srli_epi16(__m512i __A, int __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS512 _mm512_movepi8_mask(__m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_subs_epu8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_subs_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_srl_epi16(__mmask32 __U, __m512i __A, __m128i __B)
static __inline__ void __DEFAULT_FN_ATTRS512 _mm512_mask_storeu_epi8(void *__P, __mmask64 __U, __m512i __A)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS _kandn_mask64(__mmask64 __A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_adds_epi8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_min_epi16(__mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_subs_epu8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_srlv_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_broadcastb_epi8(__mmask64 __M, __m128i __A)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS _load_mask64(__mmask64 *__A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_unpacklo_epi16(__m512i __A, __m512i __B)
static __inline __m512i __DEFAULT_FN_ATTRS512 _mm512_set1_epi8(char __w)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_abs_epi8(__m512i __W, __mmask64 __U, __m512i __A)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _ktest_mask32_u8(__mmask32 __A, __mmask32 __B, unsigned char *__C)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_min_epu8(__m512i __W, __mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_madd_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_loadu_epi16(__m512i __W, __mmask32 __U, void const *__P)
static __inline__ void __DEFAULT_FN_ATTRS512 _mm512_mask_cvtepi16_storeu_epi8(void *__P, __mmask32 __M, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_cvtepu8_epi16(__m512i __W, __mmask32 __U, __m256i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_permutex2var_epi16(__mmask32 __U, __m512i __A, __m512i __I, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_packs_epi32(__m512i __W, __mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_abs_epi8(__mmask64 __U, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_packs_epi16(__mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_loadu_epi8(__mmask64 __U, void const *__P)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_permutexvar_epi16(__m512i __W, __mmask32 __M, __m512i __A, __m512i __B)
static __inline__ unsigned int __DEFAULT_FN_ATTRS _cvtmask32_u32(__mmask32 __A)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS _cvtu32_mask32(unsigned int __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_adds_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m256i __DEFAULT_FN_ATTRS512 _mm512_mask_cvtusepi16_epi8(__m256i __O, __mmask32 __M, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_mullo_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_slli_epi16(__m512i __A, int __B)
static __inline__ void __DEFAULT_FN_ATTRS512 _mm512_mask_storeu_epi16(void *__P, __mmask32 __U, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_avg_epu8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline void __DEFAULT_FN_ATTRS512 _mm512_storeu_epi8(void *__P, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_sub_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_srav_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mullo_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_blend_epi16(__mmask32 __U, __m512i __A, __m512i __W)
#define __DEFAULT_FN_ATTRS512
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_sll_epi16(__mmask32 __U, __m512i __A, __m128i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_adds_epu16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_min_epi8(__mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS512 _mm512_kunpackw(__mmask32 __A, __mmask32 __B)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _kortestc_mask64_u8(__mmask64 __A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_set1_epi16(__mmask32 __M, short __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_sra_epi16(__m512i __A, __m128i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_max_epu16(__m512i __W, __mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS512 _mm512_mask_testn_epi16_mask(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_max_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_maddubs_epi16(__mmask32 __U, __m512i __X, __m512i __Y)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_movm_epi16(__mmask32 __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_packs_epi16(__m512i __W, __mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_mov_epi16(__m512i __W, __mmask32 __U, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_add_epi8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_adds_epu8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_adds_epi16(__m512i __A, __m512i __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS _kor_mask64(__mmask64 __A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_subs_epu16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_srli_epi16(__m512i __W, __mmask32 __U, __m512i __A, int __B)
static __inline__ __m256i __DEFAULT_FN_ATTRS512 _mm512_cvtepi16_epi8(__m512i __A)
static __inline__ __m256i __DEFAULT_FN_ATTRS512 _mm512_maskz_cvtepi16_epi8(__mmask32 __M, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_packus_epi32(__mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS _kxor_mask64(__mmask64 __A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_adds_epu8(__m512i __A, __m512i __B)
static __inline__ __m256i __DEFAULT_FN_ATTRS512 _mm512_mask_cvtsepi16_epi8(__m256i __O, __mmask32 __M, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_srl_epi16(__m512i __A, __m128i __B)
static __inline__ __m256i __DEFAULT_FN_ATTRS512 _mm512_maskz_cvtsepi16_epi8(__mmask32 __M, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_broadcastw_epi16(__mmask32 __M, __m128i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_mulhrs_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline __mmask64 __DEFAULT_FN_ATTRS _knot_mask64(__mmask64 __M)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_maddubs_epi16(__m512i __W, __mmask32 __U, __m512i __X, __m512i __Y)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_min_epu16(__m512i __W, __mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_packus_epi32(__m512i __W, __mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_srav_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS512 _mm512_mask_test_epi8_mask(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_movm_epi8(__mmask64 __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_unpacklo_epi8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_max_epi16(__m512i __W, __mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_avg_epu16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_permutex2var_epi16(__m512i __A, __mmask32 __U, __m512i __I, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_adds_epi8(__m512i __A, __m512i __B)
static __inline __m256i __DEFAULT_FN_ATTRS _mm256_setzero_si256(void)
Constructs a 256-bit integer vector initialized to zero.
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mulhi_epu16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_min_epu16(__mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_loadu_epi16(__mmask32 __U, void const *__P)
#define _mm512_mask_cmpeq_epi8_mask(k, A, B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maddubs_epi16(__m512i __X, __m512i __Y)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_unpackhi_epi8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_sll_epi16(__m512i __A, __m128i __B)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _ktestc_mask64_u8(__mmask64 __A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_max_epi8(__mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_cvtepi8_epi16(__mmask32 __U, __m256i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mulhrs_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_set1_epi8(__mmask64 __M, char __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_mov_epi8(__mmask64 __U, __m512i __A)
static __inline __m512i __DEFAULT_FN_ATTRS512 _mm512_set1_epi16(short __w)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_adds_epu16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_madd_epi16(__m512i __W, __mmask16 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_srlv_epi16(__m512i __A, __m512i __B)
#define _mm512_mask_cmpeq_epi16_mask(k, A, B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_sllv_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_sra_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m128i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_sub_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _ktest_mask64_u8(__mmask64 __A, __mmask64 __B, unsigned char *__C)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _ktestz_mask64_u8(__mmask64 __A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_loadu_epi8(__m512i __W, __mmask64 __U, void const *__P)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _kortestz_mask32_u8(__mmask32 __A, __mmask32 __B)
static __inline __m512i __DEFAULT_FN_ATTRS512 _mm512_loadu_epi16(void const *__P)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_packus_epi16(__m512i __W, __mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_min_epu16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_subs_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS512 _mm512_movepi16_mask(__m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_madd_epi16(__mmask16 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask2_permutex2var_epi16(__m512i __A, __m512i __I, __mmask32 __U, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_add_epi8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_min_epi16(__m512i __W, __mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __m256i __DEFAULT_FN_ATTRS512 _mm512_maskz_cvtusepi16_epi8(__mmask32 __M, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mulhi_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_packs_epi32(__m512i __A, __m512i __B)