clang 18.0.0git
|
Go to the source code of this file.
Macros | |
#define | __DEFAULT_FN_ATTRS256 |
#define | __DEFAULT_FN_ATTRS128 |
Functions | |
static __inline__ __m128i __DEFAULT_FN_ATTRS128 | _mm_dpbssd_epi32 (__m128i __W, __m128i __A, __m128i __B) |
Multiply groups of 4 adjacent pairs of signed 8-bit integers in __A with corresponding signed 8-bit integers in __B, producing 4 intermediate signed 16-bit results. | |
static __inline__ __m256i __DEFAULT_FN_ATTRS256 | _mm256_dpbssd_epi32 (__m256i __W, __m256i __A, __m256i __B) |
Multiply groups of 4 adjacent pairs of signed 8-bit integers in __A with corresponding signed 8-bit integers in __B, producing 4 intermediate signed 16-bit results. | |
static __inline__ __m128i __DEFAULT_FN_ATTRS128 | _mm_dpbssds_epi32 (__m128i __W, __m128i __A, __m128i __B) |
Multiply groups of 4 adjacent pairs of signed 8-bit integers in __A with corresponding signed 8-bit integers in __B, producing 4 intermediate signed 16-bit results. | |
static __inline__ __m256i __DEFAULT_FN_ATTRS256 | _mm256_dpbssds_epi32 (__m256i __W, __m256i __A, __m256i __B) |
Multiply groups of 4 adjacent pairs of signed 8-bit integers in __A with corresponding signed 8-bit integers in __B, producing 4 intermediate signed 16-bit results. | |
static __inline__ __m128i __DEFAULT_FN_ATTRS128 | _mm_dpbsud_epi32 (__m128i __W, __m128i __A, __m128i __B) |
Multiply groups of 4 adjacent pairs of signed 8-bit integers in __A with corresponding unsigned 8-bit integers in __B, producing 4 intermediate signed 16-bit results. | |
static __inline__ __m256i __DEFAULT_FN_ATTRS256 | _mm256_dpbsud_epi32 (__m256i __W, __m256i __A, __m256i __B) |
Multiply groups of 4 adjacent pairs of signed 8-bit integers in __A with corresponding unsigned 8-bit integers in __B, producing 4 intermediate signed 16-bit results. | |
static __inline__ __m128i __DEFAULT_FN_ATTRS128 | _mm_dpbsuds_epi32 (__m128i __W, __m128i __A, __m128i __B) |
Multiply groups of 4 adjacent pairs of signed 8-bit integers in __A with corresponding unsigned 8-bit integers in __B, producing 4 intermediate signed 16-bit results. | |
static __inline__ __m256i __DEFAULT_FN_ATTRS256 | _mm256_dpbsuds_epi32 (__m256i __W, __m256i __A, __m256i __B) |
Multiply groups of 4 adjacent pairs of signed 8-bit integers in __A with corresponding unsigned 8-bit integers in __B, producing 4 intermediate signed 16-bit results. | |
static __inline__ __m128i __DEFAULT_FN_ATTRS128 | _mm_dpbuud_epi32 (__m128i __W, __m128i __A, __m128i __B) |
Multiply groups of 4 adjacent pairs of unsigned 8-bit integers in __A with corresponding unsigned 8-bit integers in __B, producing 4 intermediate signed 16-bit results. | |
static __inline__ __m256i __DEFAULT_FN_ATTRS256 | _mm256_dpbuud_epi32 (__m256i __W, __m256i __A, __m256i __B) |
Multiply groups of 4 adjacent pairs of unsigned 8-bit integers in __A with corresponding unsigned 8-bit integers in __B, producing 4 intermediate signed 16-bit results. | |
static __inline__ __m128i __DEFAULT_FN_ATTRS128 | _mm_dpbuuds_epi32 (__m128i __W, __m128i __A, __m128i __B) |
Multiply groups of 4 adjacent pairs of unsigned 8-bit integers in __A with corresponding unsigned 8-bit integers in __B, producing 4 intermediate signed 16-bit results. | |
static __inline__ __m256i __DEFAULT_FN_ATTRS256 | _mm256_dpbuuds_epi32 (__m256i __W, __m256i __A, __m256i __B) |
Multiply groups of 4 adjacent pairs of unsigned 8-bit integers in __A with corresponding unsigned 8-bit integers in __B, producing 4 intermediate signed 16-bit results. | |
#define __DEFAULT_FN_ATTRS128 |
Definition at line 21 of file avxvnniint8intrin.h.
#define __DEFAULT_FN_ATTRS256 |
Definition at line 18 of file avxvnniint8intrin.h.
|
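static __inline__ __m256i __DEFAULT_FN_ATTRS256 _mm256_dpbssd_epi32 (__m256i __W, __m256i __A, __m256i __B) |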
Multiply groups of 4 adjacent pairs of signed 8-bit integers in __A with corresponding signed 8-bit integers in __B, producing 4 intermediate signed 16-bit results.
Sum these 4 results with the corresponding 32-bit integer in __W, and store the packed 32-bit results in dst.
This intrinsic corresponds to the VPDPBSSD
instruction.
__A | A 256-bit vector of [32 x char]. |
__B | A 256-bit vector of [32 x char]. |
Definition at line 93 of file avxvnniint8intrin.h.
|
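static __inline__ __m256i __DEFAULT_FN_ATTRS256 _mm256_dpbssds_epi32 (__m256i __W, __m256i __A, __m256i __B) |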
Multiply groups of 4 adjacent pairs of signed 8-bit integers in __A with corresponding signed 8-bit integers in __B, producing 4 intermediate signed 16-bit results.
Sum these 4 results with the corresponding 32-bit integer in __W with signed saturation, and store the packed 32-bit results in dst.
This intrinsic corresponds to the VPDPBSSDS
instruction.
__A | A 256-bit vector of [32 x char]. |
__B | A 256-bit vector of [32 x char]. |
Definition at line 168 of file avxvnniint8intrin.h.
|
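static __inline__ __m256i __DEFAULT_FN_ATTRS256 _mm256_dpbsud_epi32 (__m256i __W, __m256i __A, __m256i __B) |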
Multiply groups of 4 adjacent pairs of signed 8-bit integers in __A with corresponding unsigned 8-bit integers in __B, producing 4 intermediate signed 16-bit results.
Sum these 4 results with the corresponding 32-bit integer in __W, and store the packed 32-bit results in dst.
This intrinsic corresponds to the VPDPBSUD
instruction.
__A | A 256-bit vector of [32 x char]. |
__B | A 256-bit vector of [32 x unsigned char]. |
Definition at line 241 of file avxvnniint8intrin.h.
|
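static __inline__ __m256i __DEFAULT_FN_ATTRS256 _mm256_dpbsuds_epi32 (__m256i __W, __m256i __A, __m256i __B) |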
Multiply groups of 4 adjacent pairs of signed 8-bit integers in __A with corresponding unsigned 8-bit integers in __B, producing 4 intermediate signed 16-bit results.
Sum these 4 results with the corresponding 32-bit integer in __W with signed saturation, and store the packed 32-bit results in dst.
This intrinsic corresponds to the VPDPBSUDS
instruction.
__A | A 256-bit vector of [32 x char]. |
__B | A 256-bit vector of [32 x unsigned char]. |
Definition at line 316 of file avxvnniint8intrin.h.
|
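static __inline__ __m256i __DEFAULT_FN_ATTRS256 _mm256_dpbuud_epi32 (__m256i __W, __m256i __A, __m256i __B) |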
Multiply groups of 4 adjacent pairs of unsigned 8-bit integers in __A with corresponding unsigned 8-bit integers in __B, producing 4 intermediate signed 16-bit results.
Sum these 4 results with the corresponding 32-bit integer in __W, and store the packed 32-bit results in dst.
This intrinsic corresponds to the VPDPBUUD
instruction.
__A | A 256-bit vector of [32 x unsigned char]. |
__B | A 256-bit vector of [32 x unsigned char]. |
Definition at line 389 of file avxvnniint8intrin.h.
|
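static __inline__ __m256i __DEFAULT_FN_ATTRS256 _mm256_dpbuuds_epi32 (__m256i __W, __m256i __A, __m256i __B) |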
Multiply groups of 4 adjacent pairs of unsigned 8-bit integers in __A with corresponding unsigned 8-bit integers in __B, producing 4 intermediate signed 16-bit results.
Sum these 4 results with the corresponding 32-bit integer in __W with unsigned saturation, and store the packed 32-bit results in dst.
This intrinsic corresponds to the VPDPBUUDS
instruction.
__A | A 256-bit vector of [32 x unsigned char]. |
__B | A 256-bit vector of [32 x unsigned char]. |
Definition at line 464 of file avxvnniint8intrin.h.
|
static __inline__ __m128i __DEFAULT_FN_ATTRS128 _mm_dpbssd_epi32 (__m128i __W, __m128i __A, __m128i __B) |
Multiply groups of 4 adjacent pairs of signed 8-bit integers in __A with corresponding signed 8-bit integers in __B, producing 4 intermediate signed 16-bit results.
Sum these 4 results with the corresponding 32-bit integer in __W, and store the packed 32-bit results in dst.
This intrinsic corresponds to the VPDPBSSD
instruction.
__A | A 128-bit vector of [16 x char]. |
__B | A 128-bit vector of [16 x char]. |
Definition at line 55 of file avxvnniint8intrin.h.
|
static __inline__ __m128i __DEFAULT_FN_ATTRS128 _mm_dpbssds_epi32 (__m128i __W, __m128i __A, __m128i __B) |
Multiply groups of 4 adjacent pairs of signed 8-bit integers in __A with corresponding signed 8-bit integers in __B, producing 4 intermediate signed 16-bit results.
Sum these 4 results with the corresponding 32-bit integer in __W with signed saturation, and store the packed 32-bit results in dst.
This intrinsic corresponds to the VPDPBSSDS
instruction.
__A | A 128-bit vector of [16 x char]. |
__B | A 128-bit vector of [16 x char]. |
Definition at line 129 of file avxvnniint8intrin.h.
|
static __inline__ __m128i __DEFAULT_FN_ATTRS128 _mm_dpbsud_epi32 (__m128i __W, __m128i __A, __m128i __B) |
Multiply groups of 4 adjacent pairs of signed 8-bit integers in __A with corresponding unsigned 8-bit integers in __B, producing 4 intermediate signed 16-bit results.
Sum these 4 results with the corresponding 32-bit integer in __W, and store the packed 32-bit results in dst.
This intrinsic corresponds to the VPDPBSUD
instruction.
__A | A 128-bit vector of [16 x char]. |
__B | A 128-bit vector of [16 x unsigned char]. |
Definition at line 203 of file avxvnniint8intrin.h.
|
static __inline__ __m128i __DEFAULT_FN_ATTRS128 _mm_dpbsuds_epi32 (__m128i __W, __m128i __A, __m128i __B) |
Multiply groups of 4 adjacent pairs of signed 8-bit integers in __A with corresponding unsigned 8-bit integers in __B, producing 4 intermediate signed 16-bit results.
Sum these 4 results with the corresponding 32-bit integer in __W with signed saturation, and store the packed 32-bit results in dst.
This intrinsic corresponds to the VPDPBSUDS
instruction.
__A | A 128-bit vector of [16 x char]. |
__B | A 128-bit vector of [16 x unsigned char]. |
Definition at line 277 of file avxvnniint8intrin.h.
|
static __inline__ __m128i __DEFAULT_FN_ATTRS128 _mm_dpbuud_epi32 (__m128i __W, __m128i __A, __m128i __B) |
Multiply groups of 4 adjacent pairs of unsigned 8-bit integers in __A with corresponding unsigned 8-bit integers in __B, producing 4 intermediate signed 16-bit results.
Sum these 4 results with the corresponding 32-bit integer in __W, and store the packed 32-bit results in dst.
This intrinsic corresponds to the VPDPBUUD
instruction.
__A | A 128-bit vector of [16 x unsigned char]. |
__B | A 128-bit vector of [16 x unsigned char]. |
Definition at line 351 of file avxvnniint8intrin.h.
|
static __inline__ __m128i __DEFAULT_FN_ATTRS128 _mm_dpbuuds_epi32 (__m128i __W, __m128i __A, __m128i __B) |
Multiply groups of 4 adjacent pairs of unsigned 8-bit integers in __A with corresponding unsigned 8-bit integers in __B, producing 4 intermediate signed 16-bit results.
Sum these 4 results with the corresponding 32-bit integer in __W with unsigned saturation, and store the packed 32-bit results in dst.
This intrinsic corresponds to the VPDPBUUDS
instruction.
__A | A 128-bit vector of [16 x unsigned char]. |
__B | A 128-bit vector of [16 x unsigned char]. |
Definition at line 425 of file avxvnniint8intrin.h.