11#error "Never use <avx512bwintrin.h> directly; include <immintrin.h> instead."
14#ifndef __AVX512BWINTRIN_H
15#define __AVX512BWINTRIN_H
/* Attribute bundle for the 512-bit intrinsics declared in this header:
 * always inlined, no debug info, compiled for the "avx512bw,evex512" target
 * features, with a minimum vector width of 512. */
21#define __DEFAULT_FN_ATTRS512 \
22 __attribute__((__always_inline__, __nodebug__, \
23 __target__("avx512bw,evex512"), __min_vector_width__(512)))
/* Attribute bundle for the helpers that do not take 512-bit vectors (in the
 * visible declarations these are the mask-register functions such as
 * _kand_mask32): always inlined, no debug info, compiled for the
 * "avx512bw,no-evex512" target features. No minimum vector width is set. */
24#define __DEFAULT_FN_ATTRS \
25 __attribute__((__always_inline__, __nodebug__, \
26 __target__("avx512bw,no-evex512")))
31 return __builtin_ia32_knotsi(__M);
35 return __builtin_ia32_knotdi(__M);
96 return (
unsigned char)__builtin_ia32_kortestcsi(__A, __B);
102 return (
unsigned char)__builtin_ia32_kortestzsi(__A, __B);
107 *__C = (
unsigned char)__builtin_ia32_kortestcsi(__A, __B);
108 return (
unsigned char)__builtin_ia32_kortestzsi(__A, __B);
113 return (
unsigned char)__builtin_ia32_kortestcdi(__A, __B);
118 return (
unsigned char)__builtin_ia32_kortestzdi(__A, __B);
123 *__C = (
unsigned char)__builtin_ia32_kortestcdi(__A, __B);
124 return (
unsigned char)__builtin_ia32_kortestzdi(__A, __B);
130 return (
unsigned char)__builtin_ia32_ktestcsi(__A, __B);
136 return (
unsigned char)__builtin_ia32_ktestzsi(__A, __B);
141 *__C = (
unsigned char)__builtin_ia32_ktestcsi(__A, __B);
142 return (
unsigned char)__builtin_ia32_ktestzsi(__A, __B);
147 return (
unsigned char)__builtin_ia32_ktestcdi(__A, __B);
152 return (
unsigned char)__builtin_ia32_ktestzdi(__A, __B);
157 *__C = (
unsigned char)__builtin_ia32_ktestcdi(__A, __B);
158 return (
unsigned char)__builtin_ia32_ktestzdi(__A, __B);
/* Mask-register shift macros.
 *
 * Each macro casts A to the mask type (__mmask32 or __mmask64) and I to
 * unsigned int, forwards both to the matching __builtin_ia32_kshift* builtin,
 * and casts the result back to the same mask type.
 *
 * NOTE(review): these are macros rather than inline functions, presumably
 * because the builtin requires I to be a compile-time constant -- confirm
 * against the builtin definition. */
/* 32-bit mask, "li" builtin variant. */
172#define _kshiftli_mask32(A, I) \
173 ((__mmask32)__builtin_ia32_kshiftlisi((__mmask32)(A), (unsigned int)(I)))
/* 32-bit mask, "ri" builtin variant. */
175#define _kshiftri_mask32(A, I) \
176 ((__mmask32)__builtin_ia32_kshiftrisi((__mmask32)(A), (unsigned int)(I)))
/* 64-bit mask, "li" builtin variant. */
178#define _kshiftli_mask64(A, I) \
179 ((__mmask64)__builtin_ia32_kshiftlidi((__mmask64)(A), (unsigned int)(I)))
/* 64-bit mask, "ri" builtin variant. */
181#define _kshiftri_mask64(A, I) \
182 ((__mmask64)__builtin_ia32_kshiftridi((__mmask64)(A), (unsigned int)(I)))
186 return (
unsigned int)__builtin_ia32_kmovd((
__mmask32)__A);
191 return (
unsigned long long)__builtin_ia32_kmovq((
__mmask64)__A);
225#define _mm512_cmp_epi8_mask(a, b, p) \
226 ((__mmask64)__builtin_ia32_cmpb512_mask((__v64qi)(__m512i)(a), \
227 (__v64qi)(__m512i)(b), (int)(p), \
230#define _mm512_mask_cmp_epi8_mask(m, a, b, p) \
231 ((__mmask64)__builtin_ia32_cmpb512_mask((__v64qi)(__m512i)(a), \
232 (__v64qi)(__m512i)(b), (int)(p), \
235#define _mm512_cmp_epu8_mask(a, b, p) \
236 ((__mmask64)__builtin_ia32_ucmpb512_mask((__v64qi)(__m512i)(a), \
237 (__v64qi)(__m512i)(b), (int)(p), \
240#define _mm512_mask_cmp_epu8_mask(m, a, b, p) \
241 ((__mmask64)__builtin_ia32_ucmpb512_mask((__v64qi)(__m512i)(a), \
242 (__v64qi)(__m512i)(b), (int)(p), \
245#define _mm512_cmp_epi16_mask(a, b, p) \
246 ((__mmask32)__builtin_ia32_cmpw512_mask((__v32hi)(__m512i)(a), \
247 (__v32hi)(__m512i)(b), (int)(p), \
250#define _mm512_mask_cmp_epi16_mask(m, a, b, p) \
251 ((__mmask32)__builtin_ia32_cmpw512_mask((__v32hi)(__m512i)(a), \
252 (__v32hi)(__m512i)(b), (int)(p), \
255#define _mm512_cmp_epu16_mask(a, b, p) \
256 ((__mmask32)__builtin_ia32_ucmpw512_mask((__v32hi)(__m512i)(a), \
257 (__v32hi)(__m512i)(b), (int)(p), \
260#define _mm512_mask_cmp_epu16_mask(m, a, b, p) \
261 ((__mmask32)__builtin_ia32_ucmpw512_mask((__v32hi)(__m512i)(a), \
262 (__v32hi)(__m512i)(b), (int)(p), \
/* Fixed-predicate compare shorthands for the "epi8" element type.
 *
 * Every unmasked macro expands to _mm512_cmp_epi8_mask(A, B, <predicate>);
 * every _mm512_mask_* macro expands to _mm512_mask_cmp_epi8_mask(k, A, B,
 * <predicate>). The predicate is one of _MM_CMPINT_EQ / GE / GT / LE / LT / NE,
 * matching the eq / ge / gt / le / lt / neq part of the macro name. All
 * arguments are parenthesized before being forwarded. */
265#define _mm512_cmpeq_epi8_mask(A, B) \
266 _mm512_cmp_epi8_mask((A), (B), _MM_CMPINT_EQ)
267#define _mm512_mask_cmpeq_epi8_mask(k, A, B) \
268 _mm512_mask_cmp_epi8_mask((k), (A), (B), _MM_CMPINT_EQ)
269#define _mm512_cmpge_epi8_mask(A, B) \
270 _mm512_cmp_epi8_mask((A), (B), _MM_CMPINT_GE)
271#define _mm512_mask_cmpge_epi8_mask(k, A, B) \
272 _mm512_mask_cmp_epi8_mask((k), (A), (B), _MM_CMPINT_GE)
273#define _mm512_cmpgt_epi8_mask(A, B) \
274 _mm512_cmp_epi8_mask((A), (B), _MM_CMPINT_GT)
275#define _mm512_mask_cmpgt_epi8_mask(k, A, B) \
276 _mm512_mask_cmp_epi8_mask((k), (A), (B), _MM_CMPINT_GT)
277#define _mm512_cmple_epi8_mask(A, B) \
278 _mm512_cmp_epi8_mask((A), (B), _MM_CMPINT_LE)
279#define _mm512_mask_cmple_epi8_mask(k, A, B) \
280 _mm512_mask_cmp_epi8_mask((k), (A), (B), _MM_CMPINT_LE)
281#define _mm512_cmplt_epi8_mask(A, B) \
282 _mm512_cmp_epi8_mask((A), (B), _MM_CMPINT_LT)
283#define _mm512_mask_cmplt_epi8_mask(k, A, B) \
284 _mm512_mask_cmp_epi8_mask((k), (A), (B), _MM_CMPINT_LT)
285#define _mm512_cmpneq_epi8_mask(A, B) \
286 _mm512_cmp_epi8_mask((A), (B), _MM_CMPINT_NE)
287#define _mm512_mask_cmpneq_epi8_mask(k, A, B) \
288 _mm512_mask_cmp_epi8_mask((k), (A), (B), _MM_CMPINT_NE)
/* Fixed-predicate compare shorthands for the "epu8" element type.
 *
 * Every unmasked macro expands to _mm512_cmp_epu8_mask(A, B, <predicate>);
 * every _mm512_mask_* macro expands to _mm512_mask_cmp_epu8_mask(k, A, B,
 * <predicate>). The predicate is one of _MM_CMPINT_EQ / GE / GT / LE / LT / NE,
 * matching the eq / ge / gt / le / lt / neq part of the macro name. */
290#define _mm512_cmpeq_epu8_mask(A, B) \
291 _mm512_cmp_epu8_mask((A), (B), _MM_CMPINT_EQ)
292#define _mm512_mask_cmpeq_epu8_mask(k, A, B) \
293 _mm512_mask_cmp_epu8_mask((k), (A), (B), _MM_CMPINT_EQ)
294#define _mm512_cmpge_epu8_mask(A, B) \
295 _mm512_cmp_epu8_mask((A), (B), _MM_CMPINT_GE)
296#define _mm512_mask_cmpge_epu8_mask(k, A, B) \
297 _mm512_mask_cmp_epu8_mask((k), (A), (B), _MM_CMPINT_GE)
298#define _mm512_cmpgt_epu8_mask(A, B) \
299 _mm512_cmp_epu8_mask((A), (B), _MM_CMPINT_GT)
300#define _mm512_mask_cmpgt_epu8_mask(k, A, B) \
301 _mm512_mask_cmp_epu8_mask((k), (A), (B), _MM_CMPINT_GT)
302#define _mm512_cmple_epu8_mask(A, B) \
303 _mm512_cmp_epu8_mask((A), (B), _MM_CMPINT_LE)
304#define _mm512_mask_cmple_epu8_mask(k, A, B) \
305 _mm512_mask_cmp_epu8_mask((k), (A), (B), _MM_CMPINT_LE)
306#define _mm512_cmplt_epu8_mask(A, B) \
307 _mm512_cmp_epu8_mask((A), (B), _MM_CMPINT_LT)
308#define _mm512_mask_cmplt_epu8_mask(k, A, B) \
309 _mm512_mask_cmp_epu8_mask((k), (A), (B), _MM_CMPINT_LT)
310#define _mm512_cmpneq_epu8_mask(A, B) \
311 _mm512_cmp_epu8_mask((A), (B), _MM_CMPINT_NE)
312#define _mm512_mask_cmpneq_epu8_mask(k, A, B) \
313 _mm512_mask_cmp_epu8_mask((k), (A), (B), _MM_CMPINT_NE)
/* Fixed-predicate compare shorthands for the "epi16" element type.
 *
 * Every unmasked macro expands to _mm512_cmp_epi16_mask(A, B, <predicate>);
 * every _mm512_mask_* macro expands to _mm512_mask_cmp_epi16_mask(k, A, B,
 * <predicate>). The predicate is one of _MM_CMPINT_EQ / GE / GT / LE / LT / NE,
 * matching the eq / ge / gt / le / lt / neq part of the macro name. */
315#define _mm512_cmpeq_epi16_mask(A, B) \
316 _mm512_cmp_epi16_mask((A), (B), _MM_CMPINT_EQ)
317#define _mm512_mask_cmpeq_epi16_mask(k, A, B) \
318 _mm512_mask_cmp_epi16_mask((k), (A), (B), _MM_CMPINT_EQ)
319#define _mm512_cmpge_epi16_mask(A, B) \
320 _mm512_cmp_epi16_mask((A), (B), _MM_CMPINT_GE)
321#define _mm512_mask_cmpge_epi16_mask(k, A, B) \
322 _mm512_mask_cmp_epi16_mask((k), (A), (B), _MM_CMPINT_GE)
323#define _mm512_cmpgt_epi16_mask(A, B) \
324 _mm512_cmp_epi16_mask((A), (B), _MM_CMPINT_GT)
325#define _mm512_mask_cmpgt_epi16_mask(k, A, B) \
326 _mm512_mask_cmp_epi16_mask((k), (A), (B), _MM_CMPINT_GT)
327#define _mm512_cmple_epi16_mask(A, B) \
328 _mm512_cmp_epi16_mask((A), (B), _MM_CMPINT_LE)
329#define _mm512_mask_cmple_epi16_mask(k, A, B) \
330 _mm512_mask_cmp_epi16_mask((k), (A), (B), _MM_CMPINT_LE)
331#define _mm512_cmplt_epi16_mask(A, B) \
332 _mm512_cmp_epi16_mask((A), (B), _MM_CMPINT_LT)
333#define _mm512_mask_cmplt_epi16_mask(k, A, B) \
334 _mm512_mask_cmp_epi16_mask((k), (A), (B), _MM_CMPINT_LT)
335#define _mm512_cmpneq_epi16_mask(A, B) \
336 _mm512_cmp_epi16_mask((A), (B), _MM_CMPINT_NE)
337#define _mm512_mask_cmpneq_epi16_mask(k, A, B) \
338 _mm512_mask_cmp_epi16_mask((k), (A), (B), _MM_CMPINT_NE)
/* Fixed-predicate compare shorthands for the "epu16" element type.
 *
 * Every unmasked macro expands to _mm512_cmp_epu16_mask(A, B, <predicate>);
 * every _mm512_mask_* macro expands to _mm512_mask_cmp_epu16_mask(k, A, B,
 * <predicate>). The predicate is one of _MM_CMPINT_EQ / GE / GT / LE / LT / NE,
 * matching the eq / ge / gt / le / lt / neq part of the macro name. */
340#define _mm512_cmpeq_epu16_mask(A, B) \
341 _mm512_cmp_epu16_mask((A), (B), _MM_CMPINT_EQ)
342#define _mm512_mask_cmpeq_epu16_mask(k, A, B) \
343 _mm512_mask_cmp_epu16_mask((k), (A), (B), _MM_CMPINT_EQ)
344#define _mm512_cmpge_epu16_mask(A, B) \
345 _mm512_cmp_epu16_mask((A), (B), _MM_CMPINT_GE)
346#define _mm512_mask_cmpge_epu16_mask(k, A, B) \
347 _mm512_mask_cmp_epu16_mask((k), (A), (B), _MM_CMPINT_GE)
348#define _mm512_cmpgt_epu16_mask(A, B) \
349 _mm512_cmp_epu16_mask((A), (B), _MM_CMPINT_GT)
350#define _mm512_mask_cmpgt_epu16_mask(k, A, B) \
351 _mm512_mask_cmp_epu16_mask((k), (A), (B), _MM_CMPINT_GT)
352#define _mm512_cmple_epu16_mask(A, B) \
353 _mm512_cmp_epu16_mask((A), (B), _MM_CMPINT_LE)
354#define _mm512_mask_cmple_epu16_mask(k, A, B) \
355 _mm512_mask_cmp_epu16_mask((k), (A), (B), _MM_CMPINT_LE)
356#define _mm512_cmplt_epu16_mask(A, B) \
357 _mm512_cmp_epu16_mask((A), (B), _MM_CMPINT_LT)
358#define _mm512_mask_cmplt_epu16_mask(k, A, B) \
359 _mm512_mask_cmp_epu16_mask((k), (A), (B), _MM_CMPINT_LT)
360#define _mm512_cmpneq_epu16_mask(A, B) \
361 _mm512_cmp_epu16_mask((A), (B), _MM_CMPINT_NE)
362#define _mm512_mask_cmpneq_epu16_mask(k, A, B) \
363 _mm512_mask_cmp_epu16_mask((k), (A), (B), _MM_CMPINT_NE)
367 return (__m512i) ((__v64qu) __A + (__v64qu) __B);
372 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
379 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
386 return (__m512i) ((__v64qu) __A - (__v64qu) __B);
391 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
398 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
405 return (__m512i) ((__v32hu) __A + (__v32hu) __B);
410 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
417 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
424 return (__m512i) ((__v32hu) __A - (__v32hu) __B);
429 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
436 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
443 return (__m512i) ((__v32hu) __A * (__v32hu) __B);
448 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
455 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
463 return (__m512i) __builtin_ia32_selectb_512 ((
__mmask64) __U,
471 return (__m512i) __builtin_ia32_selectw_512 ((
__mmask32) __U,
479 return (__m512i)__builtin_elementwise_abs((__v64qs)__A);
485 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
493 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
501 return (__m512i)__builtin_elementwise_abs((__v32hi)__A);
507 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
515 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
523 return (__m512i)__builtin_ia32_packssdw512((__v16si)__A, (__v16si)__B);
529 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
537 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
545 return (__m512i)__builtin_ia32_packsswb512((__v32hi)__A, (__v32hi) __B);
551 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
559 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
567 return (__m512i)__builtin_ia32_packusdw512((__v16si) __A, (__v16si) __B);
573 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
581 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
589 return (__m512i)__builtin_ia32_packuswb512((__v32hi) __A, (__v32hi) __B);
595 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
603 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
611 return (__m512i)__builtin_elementwise_add_sat((__v64qs)__A, (__v64qs)__B);
617 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
625 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
633 return (__m512i)__builtin_elementwise_add_sat((__v32hi)__A, (__v32hi)__B);
639 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
647 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
655 return (__m512i)__builtin_elementwise_add_sat((__v64qu) __A, (__v64qu) __B);
661 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
669 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
677 return (__m512i)__builtin_elementwise_add_sat((__v32hu) __A, (__v32hu) __B);
683 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
691 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
699 return (__m512i)__builtin_ia32_pavgb512((__v64qi)__A, (__v64qi)__B);
706 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
714 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
722 return (__m512i)__builtin_ia32_pavgw512((__v32hi)__A, (__v32hi)__B);
729 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
737 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
745 return (__m512i)__builtin_elementwise_max((__v64qs) __A, (__v64qs) __B);
751 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
759 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
767 return (__m512i)__builtin_elementwise_max((__v32hi) __A, (__v32hi) __B);
773 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
782 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
790 return (__m512i)__builtin_elementwise_max((__v64qu)__A, (__v64qu)__B);
796 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
804 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
812 return (__m512i)__builtin_elementwise_max((__v32hu)__A, (__v32hu)__B);
818 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
826 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
834 return (__m512i)__builtin_elementwise_min((__v64qs) __A, (__v64qs) __B);
840 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
848 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
856 return (__m512i)__builtin_elementwise_min((__v32hi) __A, (__v32hi) __B);
862 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
870 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
878 return (__m512i)__builtin_elementwise_min((__v64qu)__A, (__v64qu)__B);
884 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
892 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__M,
900 return (__m512i)__builtin_elementwise_min((__v32hu)__A, (__v32hu)__B);
906 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
914 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
922 return (__m512i)__builtin_ia32_pshufb512((__v64qi)__A,(__v64qi)__B);
928 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
936 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
944 return (__m512i)__builtin_elementwise_sub_sat((__v64qs)__A, (__v64qs)__B);
950 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
958 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
966 return (__m512i)__builtin_elementwise_sub_sat((__v32hi)__A, (__v32hi)__B);
972 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
980 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
988 return (__m512i)__builtin_elementwise_sub_sat((__v64qu) __A, (__v64qu) __B);
994 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
1002 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
1010 return (__m512i)__builtin_elementwise_sub_sat((__v32hu) __A, (__v32hu) __B);
1016 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1024 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1032 return (__m512i)__builtin_ia32_vpermi2varhi512((__v32hi)__A, (__v32hi)__I,
1040 return (__m512i)__builtin_ia32_selectw_512(__U,
1049 return (__m512i)__builtin_ia32_selectw_512(__U,
1058 return (__m512i)__builtin_ia32_selectw_512(__U,
1066 return (__m512i)__builtin_ia32_pmulhrsw512((__v32hi)__A, (__v32hi)__B);
1072 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1080 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1088 return (__m512i)__builtin_ia32_pmulhw512((__v32hi) __A, (__v32hi) __B);
1095 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1103 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1111 return (__m512i)__builtin_ia32_pmulhuw512((__v32hi) __A, (__v32hi) __B);
1117 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1125 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1132 return (__m512i)__builtin_ia32_pmaddubsw512((__v64qi)__X, (__v64qi)
__Y);
1138 return (__m512i)__builtin_ia32_selectw_512((
__mmask32) __U,
1145 return (__m512i)__builtin_ia32_selectw_512((
__mmask32) __U,
1152 return (__m512i)__builtin_ia32_pmaddwd512((__v32hi)__A, (__v32hi)__B);
1157 return (__m512i)__builtin_ia32_selectd_512((
__mmask16)__U,
1164 return (__m512i)__builtin_ia32_selectd_512((
__mmask16)__U,
1171 return (__m256i) __builtin_ia32_pmovswb512_mask ((__v32hi) __A,
1178 return (__m256i) __builtin_ia32_pmovswb512_mask ((__v32hi) __A,
1185 return (__m256i) __builtin_ia32_pmovswb512_mask ((__v32hi) __A,
1192 return (__m256i) __builtin_ia32_pmovuswb512_mask ((__v32hi) __A,
1199 return (__m256i) __builtin_ia32_pmovuswb512_mask ((__v32hi) __A,
1206 return (__m256i) __builtin_ia32_pmovuswb512_mask ((__v32hi) __A,
1213 return (__m256i) __builtin_ia32_pmovwb512_mask ((__v32hi) __A,
1220 return (__m256i) __builtin_ia32_pmovwb512_mask ((__v32hi) __A,
1227 return (__m256i) __builtin_ia32_pmovwb512_mask ((__v32hi) __A,
1235 __builtin_ia32_pmovwb512mem_mask ((__v32qi *)
__P, (__v32hi) __A, __M);
1241 __builtin_ia32_pmovswb512mem_mask ((__v32qi *)
__P, (__v32hi) __A, __M);
1247 __builtin_ia32_pmovuswb512mem_mask ((__v32qi *)
__P, (__v32hi) __A, __M);
1252 return (__m512i)__builtin_shufflevector((__v64qi)__A, (__v64qi)__B,
1254 10, 64+10, 11, 64+11,
1255 12, 64+12, 13, 64+13,
1256 14, 64+14, 15, 64+15,
1257 24, 64+24, 25, 64+25,
1258 26, 64+26, 27, 64+27,
1259 28, 64+28, 29, 64+29,
1260 30, 64+30, 31, 64+31,
1261 40, 64+40, 41, 64+41,
1262 42, 64+42, 43, 64+43,
1263 44, 64+44, 45, 64+45,
1264 46, 64+46, 47, 64+47,
1265 56, 64+56, 57, 64+57,
1266 58, 64+58, 59, 64+59,
1267 60, 64+60, 61, 64+61,
1268 62, 64+62, 63, 64+63);
1273 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
1280 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
1287 return (__m512i)__builtin_shufflevector((__v32hi)__A, (__v32hi)__B,
1290 12, 32+12, 13, 32+13,
1291 14, 32+14, 15, 32+15,
1292 20, 32+20, 21, 32+21,
1293 22, 32+22, 23, 32+23,
1294 28, 32+28, 29, 32+29,
1295 30, 32+30, 31, 32+31);
1300 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1307 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1314 return (__m512i)__builtin_shufflevector((__v64qi)__A, (__v64qi)__B,
1319 16, 64+16, 17, 64+17,
1320 18, 64+18, 19, 64+19,
1321 20, 64+20, 21, 64+21,
1322 22, 64+22, 23, 64+23,
1323 32, 64+32, 33, 64+33,
1324 34, 64+34, 35, 64+35,
1325 36, 64+36, 37, 64+37,
1326 38, 64+38, 39, 64+39,
1327 48, 64+48, 49, 64+49,
1328 50, 64+50, 51, 64+51,
1329 52, 64+52, 53, 64+53,
1330 54, 64+54, 55, 64+55);
1335 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
1342 return (__m512i)__builtin_ia32_selectb_512((
__mmask64)__U,
1349 return (__m512i)__builtin_shufflevector((__v32hi)__A, (__v32hi)__B,
1353 10, 32+10, 11, 32+11,
1354 16, 32+16, 17, 32+17,
1355 18, 32+18, 19, 32+19,
1356 24, 32+24, 25, 32+25,
1357 26, 32+26, 27, 32+27);
1362 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1369 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1379 return (__m512i)__builtin_convertvector((__v32qs)__A, __v32hi);
1385 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1393 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1401 return (__m512i)__builtin_convertvector((__v32qu)__A, __v32hi);
1407 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1415 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
/* Passes A (converted to __m512i, then viewed as __v32hi) and imm (cast to
 * int) to __builtin_ia32_pshufhw512 and returns the result as __m512i.
 * NOTE(review): imm is presumably required to be a compile-time constant,
 * which would explain the macro form -- confirm against the builtin. */
1421#define _mm512_shufflehi_epi16(A, imm) \
1422 ((__m512i)__builtin_ia32_pshufhw512((__v32hi)(__m512i)(A), (int)(imm)))
1424#define _mm512_mask_shufflehi_epi16(W, U, A, imm) \
1425 ((__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
1426 (__v32hi)_mm512_shufflehi_epi16((A), \
1428 (__v32hi)(__m512i)(W)))
1430#define _mm512_maskz_shufflehi_epi16(U, A, imm) \
1431 ((__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
1432 (__v32hi)_mm512_shufflehi_epi16((A), \
1434 (__v32hi)_mm512_setzero_si512()))
/* Passes A (converted to __m512i, then viewed as __v32hi) and imm (cast to
 * int) to __builtin_ia32_pshuflw512 and returns the result as __m512i.
 * NOTE(review): imm is presumably required to be a compile-time constant,
 * which would explain the macro form -- confirm against the builtin. */
1436#define _mm512_shufflelo_epi16(A, imm) \
1437 ((__m512i)__builtin_ia32_pshuflw512((__v32hi)(__m512i)(A), (int)(imm)))
1440#define _mm512_mask_shufflelo_epi16(W, U, A, imm) \
1441 ((__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
1442 (__v32hi)_mm512_shufflelo_epi16((A), \
1444 (__v32hi)(__m512i)(W)))
1447#define _mm512_maskz_shufflelo_epi16(U, A, imm) \
1448 ((__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
1449 (__v32hi)_mm512_shufflelo_epi16((A), \
1451 (__v32hi)_mm512_setzero_si512()))
1456 return (__m512i)__builtin_ia32_psllv32hi((__v32hi) __A, (__v32hi) __B);
1462 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1470 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1478 return (__m512i)__builtin_ia32_psllw512((__v32hi) __A, (__v8hi) __B);
1484 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1492 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1500 return (__m512i)__builtin_ia32_psllwi512((__v32hi)__A, (
int)__B);
1507 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1515 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
/* Passes a (converted to __m512i, then viewed as __v8di) and imm (cast to
 * int) to __builtin_ia32_pslldqi512_byteshift and returns the result as
 * __m512i. The shift semantics are defined by the builtin, which is not
 * visible in this file. */
1520#define _mm512_bslli_epi128(a, imm) \
1521 ((__m512i)__builtin_ia32_pslldqi512_byteshift((__v8di)(__m512i)(a), (int)(imm)))
1526 return (__m512i)__builtin_ia32_psrlv32hi((__v32hi)__A, (__v32hi)__B);
1532 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1540 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1548 return (__m512i)__builtin_ia32_psrav32hi((__v32hi)__A, (__v32hi)__B);
1554 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1562 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1570 return (__m512i)__builtin_ia32_psraw512((__v32hi) __A, (__v8hi) __B);
1576 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1584 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1592 return (__m512i)__builtin_ia32_psrawi512((__v32hi)__A, (
int)__B);
1599 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1607 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1615 return (__m512i)__builtin_ia32_psrlw512((__v32hi) __A, (__v8hi) __B);
1621 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1629 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1637 return (__m512i)__builtin_ia32_psrlwi512((__v32hi)__A, (
int)__B);
1644 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
1652 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__U,
/* Passes a (converted to __m512i, then viewed as __v8di) and imm (cast to
 * int) to __builtin_ia32_psrldqi512_byteshift and returns the result as
 * __m512i. The shift semantics are defined by the builtin, which is not
 * visible in this file. */
1657#define _mm512_bsrli_epi128(a, imm) \
1658 ((__m512i)__builtin_ia32_psrldqi512_byteshift((__v8di)(__m512i)(a), (int)(imm)))
1663 return (__m512i) __builtin_ia32_selectw_512 ((
__mmask32) __U,
1671 return (__m512i) __builtin_ia32_selectw_512 ((
__mmask32) __U,
1679 return (__m512i) __builtin_ia32_selectb_512 ((
__mmask64) __U,
1687 return (__m512i) __builtin_ia32_selectb_512 ((
__mmask64) __U,
1695 return (__m512i) __builtin_ia32_selectb_512(__M,
1703 return (__m512i) __builtin_ia32_selectb_512(__M,
1724 struct __loadu_epi16 {
1727 return ((
const struct __loadu_epi16*)
__P)->__v;
1733 return (__m512i) __builtin_ia32_loaddquhi512_mask ((
const __v32hi *)
__P,
1741 return (__m512i) __builtin_ia32_loaddquhi512_mask ((
const __v32hi *)
__P,
1750 struct __loadu_epi8 {
1753 return ((
const struct __loadu_epi8*)
__P)->__v;
1759 return (__m512i) __builtin_ia32_loaddquqi512_mask ((
const __v64qi *)
__P,
1767 return (__m512i) __builtin_ia32_loaddquqi512_mask ((
const __v64qi *)
__P,
1776 struct __storeu_epi16 {
1779 ((
struct __storeu_epi16*)
__P)->__v = __A;
1785 __builtin_ia32_storedquhi512_mask ((__v32hi *)
__P,
1793 struct __storeu_epi8 {
1796 ((
struct __storeu_epi8*)
__P)->__v = __A;
1802 __builtin_ia32_storedquqi512_mask ((__v64qi *)
__P,
1865 return (
__mmask64) __builtin_ia32_cvtb2mask512 ((__v64qi) __A);
1871 return (
__mmask32) __builtin_ia32_cvtw2mask512 ((__v32hi) __A);
1877 return (__m512i) __builtin_ia32_cvtmask2b512 (__A);
1883 return (__m512i) __builtin_ia32_cvtmask2w512 (__A);
1889 return (__m512i)__builtin_shufflevector((__v16qi) __A, (__v16qi) __A,
1890 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1891 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1892 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1893 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0);
1899 return (__m512i)__builtin_ia32_selectb_512(__M,
1907 return (__m512i)__builtin_ia32_selectb_512(__M,
1915 return (__m512i) __builtin_ia32_selectw_512(__M,
1923 return (__m512i) __builtin_ia32_selectw_512(__M,
1931 return (__m512i)__builtin_shufflevector((__v8hi) __A, (__v8hi) __A,
1932 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1933 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0);
1939 return (__m512i)__builtin_ia32_selectw_512(__M,
1947 return (__m512i)__builtin_ia32_selectw_512(__M,
1955 return (__m512i)__builtin_ia32_permvarhi512((__v32hi)__B, (__v32hi)__A);
1962 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
1971 return (__m512i)__builtin_ia32_selectw_512((
__mmask32)__M,
/* Passes A and B (each converted to __m512i, then viewed as __v64qi) and N
 * (cast to int) to __builtin_ia32_palignr512; the result is returned as
 * __m512i. */
1976#define _mm512_alignr_epi8(A, B, N) \
1977 ((__m512i)__builtin_ia32_palignr512((__v64qi)(__m512i)(A), \
1978 (__v64qi)(__m512i)(B), (int)(N)))
/* Merge-masked form: feeds mask U (as __mmask64), the _mm512_alignr_epi8
 * result, and W into __builtin_ia32_selectb_512.
 * NOTE(review): presumably elements whose mask bit is set take the alignr
 * result and the rest keep W -- confirm against the select builtin. */
1980#define _mm512_mask_alignr_epi8(W, U, A, B, N) \
1981 ((__m512i)__builtin_ia32_selectb_512((__mmask64)(U), \
1982 (__v64qi)_mm512_alignr_epi8((A), (B), (int)(N)), \
1983 (__v64qi)(__m512i)(W)))
/* Zero-masked form: same as the merge-masked macro, but the fallback operand
 * is _mm512_setzero_si512() instead of a caller-supplied vector. */
1985#define _mm512_maskz_alignr_epi8(U, A, B, N) \
1986 ((__m512i)__builtin_ia32_selectb_512((__mmask64)(U), \
1987 (__v64qi)_mm512_alignr_epi8((A), (B), (int)(N)), \
1988 (__v64qi)(__m512i)_mm512_setzero_si512()))
/* Passes A and B (each converted to __m512i, then viewed as __v64qi) and imm
 * (cast to int) to __builtin_ia32_dbpsadbw512; the result is returned as
 * __m512i. */
1990#define _mm512_dbsad_epu8(A, B, imm) \
1991 ((__m512i)__builtin_ia32_dbpsadbw512((__v64qi)(__m512i)(A), \
1992 (__v64qi)(__m512i)(B), (int)(imm)))
/* Merge-masked form: feeds mask U (as __mmask32), the _mm512_dbsad_epu8
 * result viewed as __v32hi, and W viewed as __v32hi into
 * __builtin_ia32_selectw_512.
 * NOTE(review): presumably elements whose mask bit is set take the dbsad
 * result and the rest keep W -- confirm against the select builtin. */
1994#define _mm512_mask_dbsad_epu8(W, U, A, B, imm) \
1995 ((__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
1996 (__v32hi)_mm512_dbsad_epu8((A), (B), (imm)), \
1997 (__v32hi)(__m512i)(W)))
/* Zero-masked form: same as the merge-masked macro, but the fallback operand
 * is _mm512_setzero_si512() instead of a caller-supplied vector. */
1999#define _mm512_maskz_dbsad_epu8(U, A, B, imm) \
2000 ((__m512i)__builtin_ia32_selectw_512((__mmask32)(U), \
2001 (__v32hi)_mm512_dbsad_epu8((A), (B), (imm)), \
2002 (__v32hi)_mm512_setzero_si512()))
2007 return (__m512i) __builtin_ia32_psadbw512 ((__v64qi) __A,
/* Remove the attribute helper macros so they are no longer defined past this
 * point. */
2011#undef __DEFAULT_FN_ATTRS512
2012#undef __DEFAULT_FN_ATTRS
_Float16 __2f16 __attribute__((ext_vector_type(2)))
Zeroes the upper 128 bits (bits 255:128) of all YMM registers.
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_unpackhi_epi8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_sll_epi16(__mmask32 __U, __m512i __A, __m128i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_max_epu16(__mmask32 __M, __m512i __A, __m512i __B)
#define _mm512_cmpeq_epi16_mask(A, B)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _kortest_mask64_u8(__mmask64 __A, __mmask64 __B, unsigned char *__C)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_srlv_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_subs_epu8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_permutex2var_epi16(__mmask32 __U, __m512i __A, __m512i __I, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_madd_epi16(__mmask16 __U, __m512i __A, __m512i __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS _cvtu64_mask64(unsigned long long __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_avg_epu8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS _mm512_kunpackw(__mmask32 __A, __mmask32 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_adds_epu16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_adds_epi8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_unpackhi_epi8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_subs_epu16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_sub_epi8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_adds_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_cvtepi8_epi16(__m256i __A)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS _load_mask32(__mmask32 *__A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mullo_epi16(__m512i __A, __m512i __B)
static __inline__ __m256i __DEFAULT_FN_ATTRS512 _mm512_mask_cvtepi16_epi8(__m256i __O, __mmask32 __M, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_broadcastw_epi16(__m512i __O, __mmask32 __M, __m128i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_broadcastb_epi8(__m128i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_avg_epu16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS _kand_mask64(__mmask64 __A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_shuffle_epi8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_broadcastw_epi16(__m128i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_max_epu8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_set1_epi8(__m512i __O, __mmask64 __M, char __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_permutexvar_epi16(__m512i __W, __mmask32 __M, __m512i __A, __m512i __B)
static __inline void __DEFAULT_FN_ATTRS512 _mm512_storeu_epi8(void *__P, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask2_permutex2var_epi16(__m512i __A, __m512i __I, __mmask32 __U, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_cvtepi8_epi16(__mmask32 __U, __m256i __A)
#define _mm512_cmpeq_epi8_mask(A, B)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS _kandn_mask32(__mmask32 __A, __mmask32 __B)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _ktestc_mask32_u8(__mmask32 __A, __mmask32 __B)
static __inline__ void __DEFAULT_FN_ATTRS512 _mm512_mask_cvtsepi16_storeu_epi8(void *__P, __mmask32 __M, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_broadcastw_epi16(__mmask32 __M, __m128i __A)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _ktest_mask32_u8(__mmask32 __A, __mmask32 __B, unsigned char *__C)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_sra_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m128i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_set1_epi16(__mmask32 __M, short __A)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _ktestc_mask64_u8(__mmask64 __A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_min_epi16(__mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_packus_epi32(__m512i __W, __mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_add_epi8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_unpackhi_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_sub_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS512 _mm512_mask_test_epi8_mask(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _kortestz_mask64_u8(__mmask64 __A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_min_epu16(__m512i __W, __mmask32 __M, __m512i __A, __m512i __B)
#define __DEFAULT_FN_ATTRS512
static __inline__ __mmask32 __DEFAULT_FN_ATTRS512 _mm512_mask_testn_epi16_mask(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m256i __DEFAULT_FN_ATTRS512 _mm512_mask_cvtusepi16_epi8(__m256i __O, __mmask32 __M, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_abs_epi8(__m512i __W, __mmask64 __U, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_min_epu16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_sll_epi16(__m512i __A, __m128i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_sad_epu8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_permutexvar_epi16(__m512i __A, __m512i __B)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS _kand_mask32(__mmask32 __A, __mmask32 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_sub_epi8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_min_epu8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_adds_epu8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_sllv_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_srli_epi16(__m512i __W, __mmask32 __U, __m512i __A, unsigned int __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS512 _mm512_mask_testn_epi8_mask(__mmask64 __U, __m512i __A, __m512i __B)
#define _mm512_cmpneq_epi8_mask(A, B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_max_epi16(__m512i __W, __mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_subs_epu8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_slli_epi16(__m512i __A, unsigned int __B)
static __inline__ __m256i __DEFAULT_FN_ATTRS512 _mm512_maskz_cvtusepi16_epi8(__mmask32 __M, __m512i __A)
#define __DEFAULT_FN_ATTRS
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mulhrs_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_sra_epi16(__m512i __A, __m128i __B)
static __inline__ void __DEFAULT_FN_ATTRS512 _mm512_mask_storeu_epi8(void *__P, __mmask64 __U, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_sub_epi16(__m512i __A, __m512i __B)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS512 _mm512_test_epi16_mask(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_mov_epi8(__m512i __W, __mmask64 __U, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_abs_epi16(__m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_min_epi8(__mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_add_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_unpacklo_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_subs_epi8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline__ void __DEFAULT_FN_ATTRS512 _mm512_mask_storeu_epi16(void *__P, __mmask32 __U, __m512i __A)
static __inline__ __m256i __DEFAULT_FN_ATTRS512 _mm512_cvtusepi16_epi8(__m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_avg_epu16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_movm_epi16(__mmask32 __A)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS _kadd_mask32(__mmask32 __A, __mmask32 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_mulhrs_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS _kor_mask64(__mmask64 __A, __mmask64 __B)
#define _mm512_cmpneq_epi16_mask(A, B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_sll_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m128i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_srli_epi16(__m512i __A, unsigned int __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_shuffle_epi8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_max_epi8(__mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_permutex2var_epi16(__m512i __A, __mmask32 __U, __m512i __I, __m512i __B)
static __inline__ unsigned long long __DEFAULT_FN_ATTRS _cvtmask64_u64(__mmask64 __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_srlv_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_packus_epi32(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_mulhi_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_movm_epi8(__mmask64 __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_loadu_epi8(__mmask64 __U, void const *__P)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_min_epi16(__m512i __W, __mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_abs_epi8(__m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mulhi_epu16(__m512i __A, __m512i __B)
static __inline__ __m256i __DEFAULT_FN_ATTRS512 _mm512_cvtsepi16_epi8(__m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_madd_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_set1_epi8(__mmask64 __M, char __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_mulhi_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_permutexvar_epi16(__mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_add_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_adds_epi8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_sub_epi8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS512 _mm512_movepi8_mask(__m512i __A)
static __inline void __DEFAULT_FN_ATTRS512 _mm512_storeu_epi16(void *__P, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_maddubs_epi16(__m512i __W, __mmask32 __U, __m512i __X, __m512i __Y)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_srai_epi16(__m512i __A, unsigned int __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_max_epi8(__m512i __W, __mmask64 __M, __m512i __A, __m512i __B)
static __inline__ void __DEFAULT_FN_ATTRS _store_mask64(__mmask64 *__A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_min_epu8(__mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS _kandn_mask64(__mmask64 __A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_adds_epu8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_permutex2var_epi16(__m512i __A, __m512i __I, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_adds_epu16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_srlv_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_min_epu8(__m512i __W, __mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_packs_epi32(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_packus_epi16(__mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_loadu_epi16(__m512i __W, __mmask32 __U, void const *__P)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_max_epu16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_min_epu16(__mmask32 __M, __m512i __A, __m512i __B)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _kortestc_mask64_u8(__mmask64 __A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_cvtepi8_epi16(__m512i __W, __mmask32 __U, __m256i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_unpacklo_epi8(__mmask64 __U, __m512i __A, __m512i __B)
unsigned long long __mmask64
static __inline __m512i __DEFAULT_FN_ATTRS512 _mm512_loadu_epi8(void const *__P)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_unpackhi_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_subs_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_mulhi_epu16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_avg_epu16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_subs_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS _mm512_kunpackd(__mmask64 __A, __mmask64 __B)
static __inline__ void __DEFAULT_FN_ATTRS _store_mask32(__mmask32 *__A, __mmask32 __B)
#define _mm512_mask_cmpeq_epi8_mask(k, A, B)
#define _mm512_mask_cmpneq_epi16_mask(k, A, B)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS512 _mm512_testn_epi16_mask(__m512i __A, __m512i __B)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _ktestz_mask32_u8(__mmask32 __A, __mmask32 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_sllv_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maddubs_epi16(__m512i __X, __m512i __Y)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_subs_epu16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS _kxor_mask32(__mmask32 __A, __mmask32 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mulhi_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_subs_epu8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_srav_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_srli_epi16(__mmask32 __U, __m512i __A, int __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_srl_epi16(__mmask32 __U, __m512i __A, __m128i __B)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS _kor_mask32(__mmask32 __A, __mmask32 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_packs_epi32(__m512i __W, __mmask32 __M, __m512i __A, __m512i __B)
static __inline __m512i __DEFAULT_FN_ATTRS512 _mm512_loadu_epi16(void const *__P)
static __inline__ __m256i __DEFAULT_FN_ATTRS512 _mm512_mask_cvtsepi16_epi8(__m256i __O, __mmask32 __M, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_unpackhi_epi8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_mullo_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_srai_epi16(__mmask32 __U, __m512i __A, unsigned int __B)
static __inline __mmask32 __DEFAULT_FN_ATTRS _knot_mask32(__mmask32 __M)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_mulhrs_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_loadu_epi8(__m512i __W, __mmask64 __U, void const *__P)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_subs_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_srl_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m128i __B)
static __inline__ __m256i __DEFAULT_FN_ATTRS512 _mm512_maskz_cvtsepi16_epi8(__mmask32 __M, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_maddubs_epi16(__mmask32 __U, __m512i __X, __m512i __Y)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _ktestz_mask64_u8(__mmask64 __A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_adds_epu16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_packus_epi16(__m512i __W, __mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_max_epi8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_packs_epi32(__mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_unpacklo_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS _kxor_mask64(__mmask64 __A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_broadcastb_epi8(__m512i __O, __mmask64 __M, __m128i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_slli_epi16(__mmask32 __U, __m512i __A, unsigned int __B)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS512 _mm512_mask_test_epi16_mask(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_avg_epu8(__m512i __A, __m512i __B)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS _cvtu32_mask32(unsigned int __A)
static __inline__ __m256i __DEFAULT_FN_ATTRS512 _mm512_maskz_cvtepi16_epi8(__mmask32 __M, __m512i __A)
static __inline__ void __DEFAULT_FN_ATTRS512 _mm512_mask_cvtusepi16_storeu_epi8(void *__P, __mmask32 __M, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_sra_epi16(__mmask32 __U, __m512i __A, __m128i __B)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _ktest_mask64_u8(__mmask64 __A, __mmask64 __B, unsigned char *__C)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_subs_epi8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_max_epu16(__m512i __W, __mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_packus_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_max_epu8(__m512i __W, __mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_unpackhi_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_sub_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS _load_mask64(__mmask64 *__A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_broadcastb_epi8(__mmask64 __M, __m128i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_sllv_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m256i __DEFAULT_FN_ATTRS512 _mm512_cvtepi16_epi8(__m512i __A)
#define _mm512_mask_cmpeq_epi16_mask(k, A, B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_min_epi8(__m512i __W, __mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_abs_epi8(__mmask64 __U, __m512i __A)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS _kxnor_mask32(__mmask32 __A, __mmask32 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_set1_epi16(__m512i __O, __mmask32 __M, short __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_blend_epi16(__mmask32 __U, __m512i __A, __m512i __W)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_subs_epu16(__m512i __A, __m512i __B)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _kortestc_mask32_u8(__mmask32 __A, __mmask32 __B)
#define _mm512_mask_cmpneq_epi8_mask(k, A, B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_subs_epi8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_shuffle_epi8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS _kadd_mask64(__mmask64 __A, __mmask64 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_loadu_epi16(__mmask32 __U, void const *__P)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_cvtepu8_epi16(__m512i __W, __mmask32 __U, __m256i __A)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS512 _mm512_testn_epi8_mask(__m512i __A, __m512i __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS512 _mm512_test_epi8_mask(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_packs_epi16(__m512i __W, __mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_unpacklo_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_abs_epi16(__m512i __W, __mmask32 __U, __m512i __A)
static __inline__ __mmask32 __DEFAULT_FN_ATTRS512 _mm512_movepi16_mask(__m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_add_epi8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_packus_epi32(__mmask32 __M, __m512i __A, __m512i __B)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _kortest_mask32_u8(__mmask32 __A, __mmask32 __B, unsigned char *__C)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_adds_epu8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_min_epi16(__m512i __A, __m512i __B)
static __inline__ __mmask64 __DEFAULT_FN_ATTRS _kxnor_mask64(__mmask64 __A, __mmask64 __B)
static __inline__ unsigned int __DEFAULT_FN_ATTRS _cvtmask32_u32(__mmask32 __A)
static __inline__ unsigned char __DEFAULT_FN_ATTRS _kortestz_mask32_u8(__mmask32 __A, __mmask32 __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_adds_epi8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_blend_epi8(__mmask64 __U, __m512i __A, __m512i __W)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_max_epi16(__mmask32 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_srl_epi16(__m512i __A, __m128i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_max_epu8(__mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_mullo_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_unpacklo_epi8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_adds_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_unpacklo_epi8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_slli_epi16(__m512i __W, __mmask32 __U, __m512i __A, unsigned int __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_packs_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_mov_epi16(__m512i __W, __mmask32 __U, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_add_epi8(__m512i __W, __mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_cvtepu8_epi16(__mmask32 __U, __m256i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_min_epi8(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_mulhi_epu16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_adds_epi16(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_cvtepu8_epi16(__m256i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_srai_epi16(__m512i __W, __mmask32 __U, __m512i __A, unsigned int __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_add_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_srav_epi16(__mmask32 __U, __m512i __A, __m512i __B)
static __inline __mmask64 __DEFAULT_FN_ATTRS _knot_mask64(__mmask64 __M)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_madd_epi16(__m512i __W, __mmask16 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_avg_epu8(__mmask64 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_max_epi16(__m512i __A, __m512i __B)
static __inline__ void __DEFAULT_FN_ATTRS512 _mm512_mask_cvtepi16_storeu_epi8(void *__P, __mmask32 __M, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_packs_epi16(__mmask64 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_mov_epi16(__mmask32 __U, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_mask_srav_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_mov_epi8(__mmask64 __U, __m512i __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_maskz_abs_epi16(__mmask32 __U, __m512i __A)
static __inline __m512i __DEFAULT_FN_ATTRS512 _mm512_set1_epi16(short __w)
static __inline __m512i __DEFAULT_FN_ATTRS512 _mm512_set1_epi8(char __w)
static __inline__ __m512i __DEFAULT_FN_ATTRS512 _mm512_and_epi32(__m512i __a, __m512i __b)
static __inline __m512i __DEFAULT_FN_ATTRS512 _mm512_setzero_si512(void)
static __inline__ __m256i __DEFAULT_FN_ATTRS _mm256_undefined_si256(void)
Create a 256-bit integer vector with undefined values.
static __inline __m256i __DEFAULT_FN_ATTRS _mm256_setzero_si256(void)
Constructs a 256-bit integer vector initialized to zero.
struct __storeu_i16 *__P __v
__inline unsigned int unsigned int unsigned int * __P
__inline unsigned int unsigned int __Y