4186 uint32_t BuiltinID) {
4191 switch (BuiltinID) {
4192 case Builtin::BI__builtin_is_constant_evaluated:
4195 case Builtin::BI__builtin_assume:
4196 case Builtin::BI__assume:
4199 case Builtin::BI__builtin_strcmp:
4200 case Builtin::BIstrcmp:
4201 case Builtin::BI__builtin_strncmp:
4202 case Builtin::BIstrncmp:
4203 case Builtin::BI__builtin_wcsncmp:
4204 case Builtin::BIwcsncmp:
4205 case Builtin::BI__builtin_wcscmp:
4206 case Builtin::BIwcscmp:
4209 case Builtin::BI__builtin_strlen:
4210 case Builtin::BIstrlen:
4211 case Builtin::BI__builtin_wcslen:
4212 case Builtin::BIwcslen:
4215 case Builtin::BI__builtin_nan:
4216 case Builtin::BI__builtin_nanf:
4217 case Builtin::BI__builtin_nanl:
4218 case Builtin::BI__builtin_nanf16:
4219 case Builtin::BI__builtin_nanf128:
4222 case Builtin::BI__builtin_nans:
4223 case Builtin::BI__builtin_nansf:
4224 case Builtin::BI__builtin_nansl:
4225 case Builtin::BI__builtin_nansf16:
4226 case Builtin::BI__builtin_nansf128:
4229 case Builtin::BI__builtin_huge_val:
4230 case Builtin::BI__builtin_huge_valf:
4231 case Builtin::BI__builtin_huge_vall:
4232 case Builtin::BI__builtin_huge_valf16:
4233 case Builtin::BI__builtin_huge_valf128:
4234 case Builtin::BI__builtin_inf:
4235 case Builtin::BI__builtin_inff:
4236 case Builtin::BI__builtin_infl:
4237 case Builtin::BI__builtin_inff16:
4238 case Builtin::BI__builtin_inff128:
4241 case Builtin::BI__builtin_copysign:
4242 case Builtin::BI__builtin_copysignf:
4243 case Builtin::BI__builtin_copysignl:
4244 case Builtin::BI__builtin_copysignf128:
4247 case Builtin::BI__builtin_fmin:
4248 case Builtin::BI__builtin_fminf:
4249 case Builtin::BI__builtin_fminl:
4250 case Builtin::BI__builtin_fminf16:
4251 case Builtin::BI__builtin_fminf128:
4254 case Builtin::BI__builtin_fminimum_num:
4255 case Builtin::BI__builtin_fminimum_numf:
4256 case Builtin::BI__builtin_fminimum_numl:
4257 case Builtin::BI__builtin_fminimum_numf16:
4258 case Builtin::BI__builtin_fminimum_numf128:
4261 case Builtin::BI__builtin_fmax:
4262 case Builtin::BI__builtin_fmaxf:
4263 case Builtin::BI__builtin_fmaxl:
4264 case Builtin::BI__builtin_fmaxf16:
4265 case Builtin::BI__builtin_fmaxf128:
4268 case Builtin::BI__builtin_fmaximum_num:
4269 case Builtin::BI__builtin_fmaximum_numf:
4270 case Builtin::BI__builtin_fmaximum_numl:
4271 case Builtin::BI__builtin_fmaximum_numf16:
4272 case Builtin::BI__builtin_fmaximum_numf128:
4275 case Builtin::BI__builtin_isnan:
4278 case Builtin::BI__builtin_issignaling:
4281 case Builtin::BI__builtin_isinf:
4284 case Builtin::BI__builtin_isinf_sign:
4287 case Builtin::BI__builtin_isfinite:
4290 case Builtin::BI__builtin_isnormal:
4293 case Builtin::BI__builtin_issubnormal:
4296 case Builtin::BI__builtin_iszero:
4299 case Builtin::BI__builtin_signbit:
4300 case Builtin::BI__builtin_signbitf:
4301 case Builtin::BI__builtin_signbitl:
4304 case Builtin::BI__builtin_isgreater:
4305 case Builtin::BI__builtin_isgreaterequal:
4306 case Builtin::BI__builtin_isless:
4307 case Builtin::BI__builtin_islessequal:
4308 case Builtin::BI__builtin_islessgreater:
4309 case Builtin::BI__builtin_isunordered:
4312 case Builtin::BI__builtin_isfpclass:
4315 case Builtin::BI__builtin_fpclassify:
4318 case Builtin::BI__builtin_fabs:
4319 case Builtin::BI__builtin_fabsf:
4320 case Builtin::BI__builtin_fabsl:
4321 case Builtin::BI__builtin_fabsf128:
4324 case Builtin::BI__builtin_abs:
4325 case Builtin::BI__builtin_labs:
4326 case Builtin::BI__builtin_llabs:
4329 case Builtin::BI__builtin_popcount:
4330 case Builtin::BI__builtin_popcountl:
4331 case Builtin::BI__builtin_popcountll:
4332 case Builtin::BI__builtin_popcountg:
4333 case Builtin::BI__popcnt16:
4334 case Builtin::BI__popcnt:
4335 case Builtin::BI__popcnt64:
4338 case Builtin::BI__builtin_parity:
4339 case Builtin::BI__builtin_parityl:
4340 case Builtin::BI__builtin_parityll:
4343 return APInt(Val.getBitWidth(), Val.popcount() % 2);
4345 case Builtin::BI__builtin_clrsb:
4346 case Builtin::BI__builtin_clrsbl:
4347 case Builtin::BI__builtin_clrsbll:
4350 return APInt(Val.getBitWidth(),
4351 Val.getBitWidth() - Val.getSignificantBits());
4353 case Builtin::BI__builtin_bitreverseg:
4354 case Builtin::BI__builtin_bitreverse8:
4355 case Builtin::BI__builtin_bitreverse16:
4356 case Builtin::BI__builtin_bitreverse32:
4357 case Builtin::BI__builtin_bitreverse64:
4359 S, OpPC,
Call, [](
const APSInt &Val) {
return Val.reverseBits(); });
4361 case Builtin::BI__builtin_classify_type:
4364 case Builtin::BI__builtin_expect:
4365 case Builtin::BI__builtin_expect_with_probability:
4368 case Builtin::BI__builtin_rotateleft8:
4369 case Builtin::BI__builtin_rotateleft16:
4370 case Builtin::BI__builtin_rotateleft32:
4371 case Builtin::BI__builtin_rotateleft64:
4372 case Builtin::BI__builtin_stdc_rotate_left:
4373 case Builtin::BI_rotl8:
4374 case Builtin::BI_rotl16:
4375 case Builtin::BI_rotl:
4376 case Builtin::BI_lrotl:
4377 case Builtin::BI_rotl64:
4378 case Builtin::BI__builtin_rotateright8:
4379 case Builtin::BI__builtin_rotateright16:
4380 case Builtin::BI__builtin_rotateright32:
4381 case Builtin::BI__builtin_rotateright64:
4382 case Builtin::BI__builtin_stdc_rotate_right:
4383 case Builtin::BI_rotr8:
4384 case Builtin::BI_rotr16:
4385 case Builtin::BI_rotr:
4386 case Builtin::BI_lrotr:
4387 case Builtin::BI_rotr64: {
4390 switch (BuiltinID) {
4391 case Builtin::BI__builtin_rotateright8:
4392 case Builtin::BI__builtin_rotateright16:
4393 case Builtin::BI__builtin_rotateright32:
4394 case Builtin::BI__builtin_rotateright64:
4395 case Builtin::BI__builtin_stdc_rotate_right:
4396 case Builtin::BI_rotr8:
4397 case Builtin::BI_rotr16:
4398 case Builtin::BI_rotr:
4399 case Builtin::BI_lrotr:
4400 case Builtin::BI_rotr64:
4401 IsRotateRight =
true;
4404 IsRotateRight =
false;
4411 return IsRotateRight ?
Value.rotr(Amount.getZExtValue())
4412 :
Value.rotl(Amount.getZExtValue());
4416 case Builtin::BI__builtin_ffs:
4417 case Builtin::BI__builtin_ffsl:
4418 case Builtin::BI__builtin_ffsll:
4421 return APInt(Val.getBitWidth(),
4422 Val.isZero() ? 0u : Val.countTrailingZeros() + 1u);
4425 case Builtin::BIaddressof:
4426 case Builtin::BI__addressof:
4427 case Builtin::BI__builtin_addressof:
4431 case Builtin::BIas_const:
4432 case Builtin::BIforward:
4433 case Builtin::BIforward_like:
4434 case Builtin::BImove:
4435 case Builtin::BImove_if_noexcept:
4439 case Builtin::BI__builtin_eh_return_data_regno:
4442 case Builtin::BI__builtin_launder:
4446 case Builtin::BI__builtin_add_overflow:
4447 case Builtin::BI__builtin_sub_overflow:
4448 case Builtin::BI__builtin_mul_overflow:
4449 case Builtin::BI__builtin_sadd_overflow:
4450 case Builtin::BI__builtin_uadd_overflow:
4451 case Builtin::BI__builtin_uaddl_overflow:
4452 case Builtin::BI__builtin_uaddll_overflow:
4453 case Builtin::BI__builtin_usub_overflow:
4454 case Builtin::BI__builtin_usubl_overflow:
4455 case Builtin::BI__builtin_usubll_overflow:
4456 case Builtin::BI__builtin_umul_overflow:
4457 case Builtin::BI__builtin_umull_overflow:
4458 case Builtin::BI__builtin_umulll_overflow:
4459 case Builtin::BI__builtin_saddl_overflow:
4460 case Builtin::BI__builtin_saddll_overflow:
4461 case Builtin::BI__builtin_ssub_overflow:
4462 case Builtin::BI__builtin_ssubl_overflow:
4463 case Builtin::BI__builtin_ssubll_overflow:
4464 case Builtin::BI__builtin_smul_overflow:
4465 case Builtin::BI__builtin_smull_overflow:
4466 case Builtin::BI__builtin_smulll_overflow:
4469 case Builtin::BI__builtin_addcb:
4470 case Builtin::BI__builtin_addcs:
4471 case Builtin::BI__builtin_addc:
4472 case Builtin::BI__builtin_addcl:
4473 case Builtin::BI__builtin_addcll:
4474 case Builtin::BI__builtin_subcb:
4475 case Builtin::BI__builtin_subcs:
4476 case Builtin::BI__builtin_subc:
4477 case Builtin::BI__builtin_subcl:
4478 case Builtin::BI__builtin_subcll:
4481 case Builtin::BI__builtin_clz:
4482 case Builtin::BI__builtin_clzl:
4483 case Builtin::BI__builtin_clzll:
4484 case Builtin::BI__builtin_clzs:
4485 case Builtin::BI__builtin_clzg:
4486 case Builtin::BI__lzcnt16:
4487 case Builtin::BI__lzcnt:
4488 case Builtin::BI__lzcnt64:
4491 case Builtin::BI__builtin_ctz:
4492 case Builtin::BI__builtin_ctzl:
4493 case Builtin::BI__builtin_ctzll:
4494 case Builtin::BI__builtin_ctzs:
4495 case Builtin::BI__builtin_ctzg:
4498 case Builtin::BI__builtin_elementwise_clzg:
4499 case Builtin::BI__builtin_elementwise_ctzg:
4502 case Builtin::BI__builtin_bswapg:
4503 case Builtin::BI__builtin_bswap16:
4504 case Builtin::BI__builtin_bswap32:
4505 case Builtin::BI__builtin_bswap64:
4508 case Builtin::BI__atomic_always_lock_free:
4509 case Builtin::BI__atomic_is_lock_free:
4512 case Builtin::BI__c11_atomic_is_lock_free:
4515 case Builtin::BI__builtin_complex:
4518 case Builtin::BI__builtin_is_aligned:
4519 case Builtin::BI__builtin_align_up:
4520 case Builtin::BI__builtin_align_down:
4523 case Builtin::BI__builtin_assume_aligned:
4526 case clang::X86::BI__builtin_ia32_crc32qi:
4528 case clang::X86::BI__builtin_ia32_crc32hi:
4530 case clang::X86::BI__builtin_ia32_crc32si:
4532 case clang::X86::BI__builtin_ia32_crc32di:
4535 case clang::X86::BI__builtin_ia32_bextr_u32:
4536 case clang::X86::BI__builtin_ia32_bextr_u64:
4537 case clang::X86::BI__builtin_ia32_bextri_u32:
4538 case clang::X86::BI__builtin_ia32_bextri_u64:
4541 unsigned BitWidth = Val.getBitWidth();
4542 uint64_t Shift = Idx.extractBitsAsZExtValue(8, 0);
4543 uint64_t Length = Idx.extractBitsAsZExtValue(8, 8);
4544 if (Length > BitWidth) {
4549 if (Length == 0 || Shift >= BitWidth)
4550 return APInt(BitWidth, 0);
4552 uint64_t
Result = Val.getZExtValue() >> Shift;
4553 Result &= llvm::maskTrailingOnes<uint64_t>(Length);
4557 case clang::X86::BI__builtin_ia32_bzhi_si:
4558 case clang::X86::BI__builtin_ia32_bzhi_di:
4561 unsigned BitWidth = Val.getBitWidth();
4562 uint64_t Index = Idx.extractBitsAsZExtValue(8, 0);
4565 if (Index < BitWidth)
4566 Result.clearHighBits(BitWidth - Index);
4571 case clang::X86::BI__builtin_ia32_ktestcqi:
4572 case clang::X86::BI__builtin_ia32_ktestchi:
4573 case clang::X86::BI__builtin_ia32_ktestcsi:
4574 case clang::X86::BI__builtin_ia32_ktestcdi:
4577 return APInt(
sizeof(
unsigned char) * 8, (~A & B) == 0);
4580 case clang::X86::BI__builtin_ia32_ktestzqi:
4581 case clang::X86::BI__builtin_ia32_ktestzhi:
4582 case clang::X86::BI__builtin_ia32_ktestzsi:
4583 case clang::X86::BI__builtin_ia32_ktestzdi:
4586 return APInt(
sizeof(
unsigned char) * 8, (A & B) == 0);
4589 case clang::X86::BI__builtin_ia32_kortestcqi:
4590 case clang::X86::BI__builtin_ia32_kortestchi:
4591 case clang::X86::BI__builtin_ia32_kortestcsi:
4592 case clang::X86::BI__builtin_ia32_kortestcdi:
4595 return APInt(
sizeof(
unsigned char) * 8, ~(A | B) == 0);
4598 case clang::X86::BI__builtin_ia32_kortestzqi:
4599 case clang::X86::BI__builtin_ia32_kortestzhi:
4600 case clang::X86::BI__builtin_ia32_kortestzsi:
4601 case clang::X86::BI__builtin_ia32_kortestzdi:
4604 return APInt(
sizeof(
unsigned char) * 8, (A | B) == 0);
4607 case clang::X86::BI__builtin_ia32_kshiftliqi:
4608 case clang::X86::BI__builtin_ia32_kshiftlihi:
4609 case clang::X86::BI__builtin_ia32_kshiftlisi:
4610 case clang::X86::BI__builtin_ia32_kshiftlidi:
4613 unsigned Amt = RHS.getZExtValue() & 0xFF;
4614 if (Amt >= LHS.getBitWidth())
4615 return APInt::getZero(LHS.getBitWidth());
4616 return LHS.shl(Amt);
4619 case clang::X86::BI__builtin_ia32_kshiftriqi:
4620 case clang::X86::BI__builtin_ia32_kshiftrihi:
4621 case clang::X86::BI__builtin_ia32_kshiftrisi:
4622 case clang::X86::BI__builtin_ia32_kshiftridi:
4625 unsigned Amt = RHS.getZExtValue() & 0xFF;
4626 if (Amt >= LHS.getBitWidth())
4627 return APInt::getZero(LHS.getBitWidth());
4628 return LHS.lshr(Amt);
4631 case clang::X86::BI__builtin_ia32_lzcnt_u16:
4632 case clang::X86::BI__builtin_ia32_lzcnt_u32:
4633 case clang::X86::BI__builtin_ia32_lzcnt_u64:
4636 return APInt(Src.getBitWidth(), Src.countLeadingZeros());
4639 case clang::X86::BI__builtin_ia32_tzcnt_u16:
4640 case clang::X86::BI__builtin_ia32_tzcnt_u32:
4641 case clang::X86::BI__builtin_ia32_tzcnt_u64:
4644 return APInt(Src.getBitWidth(), Src.countTrailingZeros());
4647 case clang::X86::BI__builtin_ia32_pdep_si:
4648 case clang::X86::BI__builtin_ia32_pdep_di:
4651 unsigned BitWidth = Val.getBitWidth();
4654 for (
unsigned I = 0, P = 0; I != BitWidth; ++I) {
4656 Result.setBitVal(I, Val[P++]);
4662 case clang::X86::BI__builtin_ia32_pext_si:
4663 case clang::X86::BI__builtin_ia32_pext_di:
4666 unsigned BitWidth = Val.getBitWidth();
4669 for (
unsigned I = 0, P = 0; I != BitWidth; ++I) {
4671 Result.setBitVal(P++, Val[I]);
4677 case clang::X86::BI__builtin_ia32_addcarryx_u32:
4678 case clang::X86::BI__builtin_ia32_addcarryx_u64:
4679 case clang::X86::BI__builtin_ia32_subborrow_u32:
4680 case clang::X86::BI__builtin_ia32_subborrow_u64:
4684 case Builtin::BI__builtin_os_log_format_buffer_size:
4687 case Builtin::BI__builtin_ptrauth_string_discriminator:
4690 case Builtin::BI__builtin_infer_alloc_token:
4693 case Builtin::BI__noop:
4697 case Builtin::BI__builtin_operator_new:
4700 case Builtin::BI__builtin_operator_delete:
4703 case Builtin::BI__arithmetic_fence:
4706 case Builtin::BI__builtin_reduce_add:
4707 case Builtin::BI__builtin_reduce_mul:
4708 case Builtin::BI__builtin_reduce_and:
4709 case Builtin::BI__builtin_reduce_or:
4710 case Builtin::BI__builtin_reduce_xor:
4711 case Builtin::BI__builtin_reduce_min:
4712 case Builtin::BI__builtin_reduce_max:
4715 case Builtin::BI__builtin_elementwise_popcount:
4718 return APInt(Src.getBitWidth(), Src.popcount());
4720 case Builtin::BI__builtin_elementwise_bitreverse:
4722 S, OpPC,
Call, [](
const APSInt &Src) {
return Src.reverseBits(); });
4724 case Builtin::BI__builtin_elementwise_abs:
4727 case Builtin::BI__builtin_memcpy:
4728 case Builtin::BImemcpy:
4729 case Builtin::BI__builtin_wmemcpy:
4730 case Builtin::BIwmemcpy:
4731 case Builtin::BI__builtin_memmove:
4732 case Builtin::BImemmove:
4733 case Builtin::BI__builtin_wmemmove:
4734 case Builtin::BIwmemmove:
4737 case Builtin::BI__builtin_memcmp:
4738 case Builtin::BImemcmp:
4739 case Builtin::BI__builtin_bcmp:
4740 case Builtin::BIbcmp:
4741 case Builtin::BI__builtin_wmemcmp:
4742 case Builtin::BIwmemcmp:
4745 case Builtin::BImemchr:
4746 case Builtin::BI__builtin_memchr:
4747 case Builtin::BIstrchr:
4748 case Builtin::BI__builtin_strchr:
4749 case Builtin::BIwmemchr:
4750 case Builtin::BI__builtin_wmemchr:
4751 case Builtin::BIwcschr:
4752 case Builtin::BI__builtin_wcschr:
4753 case Builtin::BI__builtin_char_memchr:
4756 case Builtin::BI__builtin_object_size:
4757 case Builtin::BI__builtin_dynamic_object_size:
4760 case Builtin::BI__builtin_is_within_lifetime:
4763 case Builtin::BI__builtin_elementwise_add_sat:
4766 return LHS.isSigned() ? LHS.sadd_sat(RHS) : LHS.uadd_sat(RHS);
4769 case Builtin::BI__builtin_elementwise_sub_sat:
4772 return LHS.isSigned() ? LHS.ssub_sat(RHS) : LHS.usub_sat(RHS);
4774 case X86::BI__builtin_ia32_extract128i256:
4775 case X86::BI__builtin_ia32_vextractf128_pd256:
4776 case X86::BI__builtin_ia32_vextractf128_ps256:
4777 case X86::BI__builtin_ia32_vextractf128_si256:
4780 case X86::BI__builtin_ia32_extractf32x4_256_mask:
4781 case X86::BI__builtin_ia32_extractf32x4_mask:
4782 case X86::BI__builtin_ia32_extractf32x8_mask:
4783 case X86::BI__builtin_ia32_extractf64x2_256_mask:
4784 case X86::BI__builtin_ia32_extractf64x2_512_mask:
4785 case X86::BI__builtin_ia32_extractf64x4_mask:
4786 case X86::BI__builtin_ia32_extracti32x4_256_mask:
4787 case X86::BI__builtin_ia32_extracti32x4_mask:
4788 case X86::BI__builtin_ia32_extracti32x8_mask:
4789 case X86::BI__builtin_ia32_extracti64x2_256_mask:
4790 case X86::BI__builtin_ia32_extracti64x2_512_mask:
4791 case X86::BI__builtin_ia32_extracti64x4_mask:
4794 case clang::X86::BI__builtin_ia32_pmulhrsw128:
4795 case clang::X86::BI__builtin_ia32_pmulhrsw256:
4796 case clang::X86::BI__builtin_ia32_pmulhrsw512:
4799 return (llvm::APIntOps::mulsExtended(LHS, RHS).ashr(14) + 1)
4800 .extractBits(16, 1);
4803 case clang::X86::BI__builtin_ia32_movmskps:
4804 case clang::X86::BI__builtin_ia32_movmskpd:
4805 case clang::X86::BI__builtin_ia32_pmovmskb128:
4806 case clang::X86::BI__builtin_ia32_pmovmskb256:
4807 case clang::X86::BI__builtin_ia32_movmskps256:
4808 case clang::X86::BI__builtin_ia32_movmskpd256: {
4812 case X86::BI__builtin_ia32_psignb128:
4813 case X86::BI__builtin_ia32_psignb256:
4814 case X86::BI__builtin_ia32_psignw128:
4815 case X86::BI__builtin_ia32_psignw256:
4816 case X86::BI__builtin_ia32_psignd128:
4817 case X86::BI__builtin_ia32_psignd256:
4821 return APInt::getZero(AElem.getBitWidth());
4822 if (BElem.isNegative())
4827 case clang::X86::BI__builtin_ia32_pavgb128:
4828 case clang::X86::BI__builtin_ia32_pavgw128:
4829 case clang::X86::BI__builtin_ia32_pavgb256:
4830 case clang::X86::BI__builtin_ia32_pavgw256:
4831 case clang::X86::BI__builtin_ia32_pavgb512:
4832 case clang::X86::BI__builtin_ia32_pavgw512:
4834 llvm::APIntOps::avgCeilU);
4836 case clang::X86::BI__builtin_ia32_pmaddubsw128:
4837 case clang::X86::BI__builtin_ia32_pmaddubsw256:
4838 case clang::X86::BI__builtin_ia32_pmaddubsw512:
4843 unsigned BitWidth = 2 * LoLHS.getBitWidth();
4844 return (LoLHS.zext(BitWidth) * LoRHS.sext(BitWidth))
4845 .sadd_sat((HiLHS.zext(BitWidth) * HiRHS.sext(BitWidth)));
4848 case clang::X86::BI__builtin_ia32_pmaddwd128:
4849 case clang::X86::BI__builtin_ia32_pmaddwd256:
4850 case clang::X86::BI__builtin_ia32_pmaddwd512:
4855 unsigned BitWidth = 2 * LoLHS.getBitWidth();
4856 return (LoLHS.sext(BitWidth) * LoRHS.sext(BitWidth)) +
4857 (HiLHS.sext(BitWidth) * HiRHS.sext(BitWidth));
4860 case clang::X86::BI__builtin_ia32_pmulhuw128:
4861 case clang::X86::BI__builtin_ia32_pmulhuw256:
4862 case clang::X86::BI__builtin_ia32_pmulhuw512:
4864 llvm::APIntOps::mulhu);
4866 case clang::X86::BI__builtin_ia32_pmulhw128:
4867 case clang::X86::BI__builtin_ia32_pmulhw256:
4868 case clang::X86::BI__builtin_ia32_pmulhw512:
4870 llvm::APIntOps::mulhs);
4872 case clang::X86::BI__builtin_ia32_psllv2di:
4873 case clang::X86::BI__builtin_ia32_psllv4di:
4874 case clang::X86::BI__builtin_ia32_psllv4si:
4875 case clang::X86::BI__builtin_ia32_psllv8di:
4876 case clang::X86::BI__builtin_ia32_psllv8hi:
4877 case clang::X86::BI__builtin_ia32_psllv8si:
4878 case clang::X86::BI__builtin_ia32_psllv16hi:
4879 case clang::X86::BI__builtin_ia32_psllv16si:
4880 case clang::X86::BI__builtin_ia32_psllv32hi:
4881 case clang::X86::BI__builtin_ia32_psllwi128:
4882 case clang::X86::BI__builtin_ia32_psllwi256:
4883 case clang::X86::BI__builtin_ia32_psllwi512:
4884 case clang::X86::BI__builtin_ia32_pslldi128:
4885 case clang::X86::BI__builtin_ia32_pslldi256:
4886 case clang::X86::BI__builtin_ia32_pslldi512:
4887 case clang::X86::BI__builtin_ia32_psllqi128:
4888 case clang::X86::BI__builtin_ia32_psllqi256:
4889 case clang::X86::BI__builtin_ia32_psllqi512:
4892 if (RHS.uge(LHS.getBitWidth())) {
4893 return APInt::getZero(LHS.getBitWidth());
4895 return LHS.shl(RHS.getZExtValue());
4898 case clang::X86::BI__builtin_ia32_psrav4si:
4899 case clang::X86::BI__builtin_ia32_psrav8di:
4900 case clang::X86::BI__builtin_ia32_psrav8hi:
4901 case clang::X86::BI__builtin_ia32_psrav8si:
4902 case clang::X86::BI__builtin_ia32_psrav16hi:
4903 case clang::X86::BI__builtin_ia32_psrav16si:
4904 case clang::X86::BI__builtin_ia32_psrav32hi:
4905 case clang::X86::BI__builtin_ia32_psravq128:
4906 case clang::X86::BI__builtin_ia32_psravq256:
4907 case clang::X86::BI__builtin_ia32_psrawi128:
4908 case clang::X86::BI__builtin_ia32_psrawi256:
4909 case clang::X86::BI__builtin_ia32_psrawi512:
4910 case clang::X86::BI__builtin_ia32_psradi128:
4911 case clang::X86::BI__builtin_ia32_psradi256:
4912 case clang::X86::BI__builtin_ia32_psradi512:
4913 case clang::X86::BI__builtin_ia32_psraqi128:
4914 case clang::X86::BI__builtin_ia32_psraqi256:
4915 case clang::X86::BI__builtin_ia32_psraqi512:
4918 if (RHS.uge(LHS.getBitWidth())) {
4919 return LHS.ashr(LHS.getBitWidth() - 1);
4921 return LHS.ashr(RHS.getZExtValue());
4924 case clang::X86::BI__builtin_ia32_psrlv2di:
4925 case clang::X86::BI__builtin_ia32_psrlv4di:
4926 case clang::X86::BI__builtin_ia32_psrlv4si:
4927 case clang::X86::BI__builtin_ia32_psrlv8di:
4928 case clang::X86::BI__builtin_ia32_psrlv8hi:
4929 case clang::X86::BI__builtin_ia32_psrlv8si:
4930 case clang::X86::BI__builtin_ia32_psrlv16hi:
4931 case clang::X86::BI__builtin_ia32_psrlv16si:
4932 case clang::X86::BI__builtin_ia32_psrlv32hi:
4933 case clang::X86::BI__builtin_ia32_psrlwi128:
4934 case clang::X86::BI__builtin_ia32_psrlwi256:
4935 case clang::X86::BI__builtin_ia32_psrlwi512:
4936 case clang::X86::BI__builtin_ia32_psrldi128:
4937 case clang::X86::BI__builtin_ia32_psrldi256:
4938 case clang::X86::BI__builtin_ia32_psrldi512:
4939 case clang::X86::BI__builtin_ia32_psrlqi128:
4940 case clang::X86::BI__builtin_ia32_psrlqi256:
4941 case clang::X86::BI__builtin_ia32_psrlqi512:
4944 if (RHS.uge(LHS.getBitWidth())) {
4945 return APInt::getZero(LHS.getBitWidth());
4947 return LHS.lshr(RHS.getZExtValue());
4949 case clang::X86::BI__builtin_ia32_packsswb128:
4950 case clang::X86::BI__builtin_ia32_packsswb256:
4951 case clang::X86::BI__builtin_ia32_packsswb512:
4952 case clang::X86::BI__builtin_ia32_packssdw128:
4953 case clang::X86::BI__builtin_ia32_packssdw256:
4954 case clang::X86::BI__builtin_ia32_packssdw512:
4956 return APInt(Src).truncSSat(Src.getBitWidth() / 2);
4958 case clang::X86::BI__builtin_ia32_packusdw128:
4959 case clang::X86::BI__builtin_ia32_packusdw256:
4960 case clang::X86::BI__builtin_ia32_packusdw512:
4961 case clang::X86::BI__builtin_ia32_packuswb128:
4962 case clang::X86::BI__builtin_ia32_packuswb256:
4963 case clang::X86::BI__builtin_ia32_packuswb512:
4965 return APInt(Src).truncSSatU(Src.getBitWidth() / 2);
4968 case clang::X86::BI__builtin_ia32_selectss_128:
4969 case clang::X86::BI__builtin_ia32_selectsd_128:
4970 case clang::X86::BI__builtin_ia32_selectsh_128:
4971 case clang::X86::BI__builtin_ia32_selectsbf_128:
4973 case clang::X86::BI__builtin_ia32_vprotbi:
4974 case clang::X86::BI__builtin_ia32_vprotdi:
4975 case clang::X86::BI__builtin_ia32_vprotqi:
4976 case clang::X86::BI__builtin_ia32_vprotwi:
4977 case clang::X86::BI__builtin_ia32_prold128:
4978 case clang::X86::BI__builtin_ia32_prold256:
4979 case clang::X86::BI__builtin_ia32_prold512:
4980 case clang::X86::BI__builtin_ia32_prolq128:
4981 case clang::X86::BI__builtin_ia32_prolq256:
4982 case clang::X86::BI__builtin_ia32_prolq512:
4985 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS.rotl(RHS); });
4987 case clang::X86::BI__builtin_ia32_prord128:
4988 case clang::X86::BI__builtin_ia32_prord256:
4989 case clang::X86::BI__builtin_ia32_prord512:
4990 case clang::X86::BI__builtin_ia32_prorq128:
4991 case clang::X86::BI__builtin_ia32_prorq256:
4992 case clang::X86::BI__builtin_ia32_prorq512:
4995 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS.rotr(RHS); });
4997 case Builtin::BI__builtin_elementwise_max:
4998 case Builtin::BI__builtin_elementwise_min:
5001 case clang::X86::BI__builtin_ia32_phaddw128:
5002 case clang::X86::BI__builtin_ia32_phaddw256:
5003 case clang::X86::BI__builtin_ia32_phaddd128:
5004 case clang::X86::BI__builtin_ia32_phaddd256:
5007 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS + RHS; });
5008 case clang::X86::BI__builtin_ia32_phaddsw128:
5009 case clang::X86::BI__builtin_ia32_phaddsw256:
5012 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS.sadd_sat(RHS); });
5013 case clang::X86::BI__builtin_ia32_phsubw128:
5014 case clang::X86::BI__builtin_ia32_phsubw256:
5015 case clang::X86::BI__builtin_ia32_phsubd128:
5016 case clang::X86::BI__builtin_ia32_phsubd256:
5019 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS - RHS; });
5020 case clang::X86::BI__builtin_ia32_phsubsw128:
5021 case clang::X86::BI__builtin_ia32_phsubsw256:
5024 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS.ssub_sat(RHS); });
5025 case clang::X86::BI__builtin_ia32_haddpd:
5026 case clang::X86::BI__builtin_ia32_haddps:
5027 case clang::X86::BI__builtin_ia32_haddpd256:
5028 case clang::X86::BI__builtin_ia32_haddps256:
5031 [](
const APFloat &LHS,
const APFloat &RHS, llvm::RoundingMode RM) {
5036 case clang::X86::BI__builtin_ia32_hsubpd:
5037 case clang::X86::BI__builtin_ia32_hsubps:
5038 case clang::X86::BI__builtin_ia32_hsubpd256:
5039 case clang::X86::BI__builtin_ia32_hsubps256:
5042 [](
const APFloat &LHS,
const APFloat &RHS, llvm::RoundingMode RM) {
5044 F.subtract(RHS, RM);
5047 case clang::X86::BI__builtin_ia32_addsubpd:
5048 case clang::X86::BI__builtin_ia32_addsubps:
5049 case clang::X86::BI__builtin_ia32_addsubpd256:
5050 case clang::X86::BI__builtin_ia32_addsubps256:
5053 case clang::X86::BI__builtin_ia32_pmuldq128:
5054 case clang::X86::BI__builtin_ia32_pmuldq256:
5055 case clang::X86::BI__builtin_ia32_pmuldq512:
5060 return llvm::APIntOps::mulsExtended(LoLHS, LoRHS);
5063 case clang::X86::BI__builtin_ia32_pmuludq128:
5064 case clang::X86::BI__builtin_ia32_pmuludq256:
5065 case clang::X86::BI__builtin_ia32_pmuludq512:
5070 return llvm::APIntOps::muluExtended(LoLHS, LoRHS);
5073 case clang::X86::BI__builtin_ia32_pclmulqdq128:
5074 case clang::X86::BI__builtin_ia32_pclmulqdq256:
5075 case clang::X86::BI__builtin_ia32_pclmulqdq512:
5078 case Builtin::BI__builtin_elementwise_fma:
5082 llvm::RoundingMode RM) {
5084 F.fusedMultiplyAdd(Y, Z, RM);
5088 case X86::BI__builtin_ia32_vpmadd52luq128:
5089 case X86::BI__builtin_ia32_vpmadd52luq256:
5090 case X86::BI__builtin_ia32_vpmadd52luq512:
5093 return A + (B.trunc(52) *
C.trunc(52)).zext(64);
5095 case X86::BI__builtin_ia32_vpmadd52huq128:
5096 case X86::BI__builtin_ia32_vpmadd52huq256:
5097 case X86::BI__builtin_ia32_vpmadd52huq512:
5100 return A + llvm::APIntOps::mulhu(B.trunc(52),
C.trunc(52)).zext(64);
5103 case X86::BI__builtin_ia32_vpshldd128:
5104 case X86::BI__builtin_ia32_vpshldd256:
5105 case X86::BI__builtin_ia32_vpshldd512:
5106 case X86::BI__builtin_ia32_vpshldq128:
5107 case X86::BI__builtin_ia32_vpshldq256:
5108 case X86::BI__builtin_ia32_vpshldq512:
5109 case X86::BI__builtin_ia32_vpshldw128:
5110 case X86::BI__builtin_ia32_vpshldw256:
5111 case X86::BI__builtin_ia32_vpshldw512:
5115 return llvm::APIntOps::fshl(Hi, Lo, Amt);
5118 case X86::BI__builtin_ia32_vpshrdd128:
5119 case X86::BI__builtin_ia32_vpshrdd256:
5120 case X86::BI__builtin_ia32_vpshrdd512:
5121 case X86::BI__builtin_ia32_vpshrdq128:
5122 case X86::BI__builtin_ia32_vpshrdq256:
5123 case X86::BI__builtin_ia32_vpshrdq512:
5124 case X86::BI__builtin_ia32_vpshrdw128:
5125 case X86::BI__builtin_ia32_vpshrdw256:
5126 case X86::BI__builtin_ia32_vpshrdw512:
5131 return llvm::APIntOps::fshr(Hi, Lo, Amt);
5133 case X86::BI__builtin_ia32_vpconflictsi_128:
5134 case X86::BI__builtin_ia32_vpconflictsi_256:
5135 case X86::BI__builtin_ia32_vpconflictsi_512:
5136 case X86::BI__builtin_ia32_vpconflictdi_128:
5137 case X86::BI__builtin_ia32_vpconflictdi_256:
5138 case X86::BI__builtin_ia32_vpconflictdi_512:
5140 case X86::BI__builtin_ia32_compressdf128_mask:
5141 case X86::BI__builtin_ia32_compressdf256_mask:
5142 case X86::BI__builtin_ia32_compressdf512_mask:
5143 case X86::BI__builtin_ia32_compressdi128_mask:
5144 case X86::BI__builtin_ia32_compressdi256_mask:
5145 case X86::BI__builtin_ia32_compressdi512_mask:
5146 case X86::BI__builtin_ia32_compresshi128_mask:
5147 case X86::BI__builtin_ia32_compresshi256_mask:
5148 case X86::BI__builtin_ia32_compresshi512_mask:
5149 case X86::BI__builtin_ia32_compressqi128_mask:
5150 case X86::BI__builtin_ia32_compressqi256_mask:
5151 case X86::BI__builtin_ia32_compressqi512_mask:
5152 case X86::BI__builtin_ia32_compresssf128_mask:
5153 case X86::BI__builtin_ia32_compresssf256_mask:
5154 case X86::BI__builtin_ia32_compresssf512_mask:
5155 case X86::BI__builtin_ia32_compresssi128_mask:
5156 case X86::BI__builtin_ia32_compresssi256_mask:
5157 case X86::BI__builtin_ia32_compresssi512_mask: {
5159 Call->getArg(0)->getType()->castAs<
VectorType>()->getNumElements();
5161 S, OpPC,
Call, [NumElems](
unsigned DstIdx,
const APInt &ShuffleMask) {
5162 APInt CompressMask = ShuffleMask.trunc(NumElems);
5163 if (DstIdx < CompressMask.popcount()) {
5164 while (DstIdx != 0) {
5165 CompressMask = CompressMask & (CompressMask - 1);
5168 return std::pair<unsigned, int>{
5169 0,
static_cast<int>(CompressMask.countr_zero())};
5171 return std::pair<unsigned, int>{1,
static_cast<int>(DstIdx)};
5174 case X86::BI__builtin_ia32_expanddf128_mask:
5175 case X86::BI__builtin_ia32_expanddf256_mask:
5176 case X86::BI__builtin_ia32_expanddf512_mask:
5177 case X86::BI__builtin_ia32_expanddi128_mask:
5178 case X86::BI__builtin_ia32_expanddi256_mask:
5179 case X86::BI__builtin_ia32_expanddi512_mask:
5180 case X86::BI__builtin_ia32_expandhi128_mask:
5181 case X86::BI__builtin_ia32_expandhi256_mask:
5182 case X86::BI__builtin_ia32_expandhi512_mask:
5183 case X86::BI__builtin_ia32_expandqi128_mask:
5184 case X86::BI__builtin_ia32_expandqi256_mask:
5185 case X86::BI__builtin_ia32_expandqi512_mask:
5186 case X86::BI__builtin_ia32_expandsf128_mask:
5187 case X86::BI__builtin_ia32_expandsf256_mask:
5188 case X86::BI__builtin_ia32_expandsf512_mask:
5189 case X86::BI__builtin_ia32_expandsi128_mask:
5190 case X86::BI__builtin_ia32_expandsi256_mask:
5191 case X86::BI__builtin_ia32_expandsi512_mask: {
5193 S, OpPC,
Call, [](
unsigned DstIdx,
const APInt &ShuffleMask) {
5196 APInt ExpandMask = ShuffleMask.trunc(DstIdx + 1);
5197 if (ExpandMask[DstIdx]) {
5198 int SrcIdx = ExpandMask.popcount() - 1;
5199 return std::pair<unsigned, int>{0, SrcIdx};
5201 return std::pair<unsigned, int>{1,
static_cast<int>(DstIdx)};
5204 case clang::X86::BI__builtin_ia32_blendpd:
5205 case clang::X86::BI__builtin_ia32_blendpd256:
5206 case clang::X86::BI__builtin_ia32_blendps:
5207 case clang::X86::BI__builtin_ia32_blendps256:
5208 case clang::X86::BI__builtin_ia32_pblendw128:
5209 case clang::X86::BI__builtin_ia32_pblendw256:
5210 case clang::X86::BI__builtin_ia32_pblendd128:
5211 case clang::X86::BI__builtin_ia32_pblendd256:
5213 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5215 unsigned MaskBit = (ShuffleMask >> (DstIdx % 8)) & 0x1;
5216 unsigned SrcVecIdx = MaskBit ? 1 : 0;
5217 return std::pair<unsigned, int>{SrcVecIdx,
static_cast<int>(DstIdx)};
5222 case clang::X86::BI__builtin_ia32_blendvpd:
5223 case clang::X86::BI__builtin_ia32_blendvpd256:
5224 case clang::X86::BI__builtin_ia32_blendvps:
5225 case clang::X86::BI__builtin_ia32_blendvps256:
5229 llvm::RoundingMode) {
return C.isNegative() ? T : F; });
5231 case clang::X86::BI__builtin_ia32_pblendvb128:
5232 case clang::X86::BI__builtin_ia32_pblendvb256:
5235 return ((
APInt)
C).isNegative() ? T : F;
5237 case X86::BI__builtin_ia32_ptestz128:
5238 case X86::BI__builtin_ia32_ptestz256:
5239 case X86::BI__builtin_ia32_vtestzps:
5240 case X86::BI__builtin_ia32_vtestzps256:
5241 case X86::BI__builtin_ia32_vtestzpd:
5242 case X86::BI__builtin_ia32_vtestzpd256:
5245 [](
const APInt &A,
const APInt &B) {
return (A & B) == 0; });
5246 case X86::BI__builtin_ia32_ptestc128:
5247 case X86::BI__builtin_ia32_ptestc256:
5248 case X86::BI__builtin_ia32_vtestcps:
5249 case X86::BI__builtin_ia32_vtestcps256:
5250 case X86::BI__builtin_ia32_vtestcpd:
5251 case X86::BI__builtin_ia32_vtestcpd256:
5254 [](
const APInt &A,
const APInt &B) {
return (~A & B) == 0; });
5255 case X86::BI__builtin_ia32_ptestnzc128:
5256 case X86::BI__builtin_ia32_ptestnzc256:
5257 case X86::BI__builtin_ia32_vtestnzcps:
5258 case X86::BI__builtin_ia32_vtestnzcps256:
5259 case X86::BI__builtin_ia32_vtestnzcpd:
5260 case X86::BI__builtin_ia32_vtestnzcpd256:
5263 return ((A & B) != 0) && ((~A & B) != 0);
5265 case X86::BI__builtin_ia32_selectb_128:
5266 case X86::BI__builtin_ia32_selectb_256:
5267 case X86::BI__builtin_ia32_selectb_512:
5268 case X86::BI__builtin_ia32_selectw_128:
5269 case X86::BI__builtin_ia32_selectw_256:
5270 case X86::BI__builtin_ia32_selectw_512:
5271 case X86::BI__builtin_ia32_selectd_128:
5272 case X86::BI__builtin_ia32_selectd_256:
5273 case X86::BI__builtin_ia32_selectd_512:
5274 case X86::BI__builtin_ia32_selectq_128:
5275 case X86::BI__builtin_ia32_selectq_256:
5276 case X86::BI__builtin_ia32_selectq_512:
5277 case X86::BI__builtin_ia32_selectph_128:
5278 case X86::BI__builtin_ia32_selectph_256:
5279 case X86::BI__builtin_ia32_selectph_512:
5280 case X86::BI__builtin_ia32_selectpbf_128:
5281 case X86::BI__builtin_ia32_selectpbf_256:
5282 case X86::BI__builtin_ia32_selectpbf_512:
5283 case X86::BI__builtin_ia32_selectps_128:
5284 case X86::BI__builtin_ia32_selectps_256:
5285 case X86::BI__builtin_ia32_selectps_512:
5286 case X86::BI__builtin_ia32_selectpd_128:
5287 case X86::BI__builtin_ia32_selectpd_256:
5288 case X86::BI__builtin_ia32_selectpd_512:
5291 case X86::BI__builtin_ia32_shufps:
5292 case X86::BI__builtin_ia32_shufps256:
5293 case X86::BI__builtin_ia32_shufps512:
5295 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5296 unsigned NumElemPerLane = 4;
5297 unsigned NumSelectableElems = NumElemPerLane / 2;
5298 unsigned BitsPerElem = 2;
5299 unsigned IndexMask = 0x3;
5300 unsigned MaskBits = 8;
5301 unsigned Lane = DstIdx / NumElemPerLane;
5302 unsigned ElemInLane = DstIdx % NumElemPerLane;
5303 unsigned LaneOffset = Lane * NumElemPerLane;
5304 unsigned SrcIdx = ElemInLane >= NumSelectableElems ? 1 : 0;
5305 unsigned BitIndex = (DstIdx * BitsPerElem) % MaskBits;
5306 unsigned Index = (ShuffleMask >> BitIndex) & IndexMask;
5307 return std::pair<unsigned, int>{SrcIdx,
5308 static_cast<int>(LaneOffset + Index)};
5310 case X86::BI__builtin_ia32_shufpd:
5311 case X86::BI__builtin_ia32_shufpd256:
5312 case X86::BI__builtin_ia32_shufpd512:
5314 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5315 unsigned NumElemPerLane = 2;
5316 unsigned NumSelectableElems = NumElemPerLane / 2;
5317 unsigned BitsPerElem = 1;
5318 unsigned IndexMask = 0x1;
5319 unsigned MaskBits = 8;
5320 unsigned Lane = DstIdx / NumElemPerLane;
5321 unsigned ElemInLane = DstIdx % NumElemPerLane;
5322 unsigned LaneOffset = Lane * NumElemPerLane;
5323 unsigned SrcIdx = ElemInLane >= NumSelectableElems ? 1 : 0;
5324 unsigned BitIndex = (DstIdx * BitsPerElem) % MaskBits;
5325 unsigned Index = (ShuffleMask >> BitIndex) & IndexMask;
5326 return std::pair<unsigned, int>{SrcIdx,
5327 static_cast<int>(LaneOffset + Index)};
5330 case X86::BI__builtin_ia32_vgf2p8affineinvqb_v16qi:
5331 case X86::BI__builtin_ia32_vgf2p8affineinvqb_v32qi:
5332 case X86::BI__builtin_ia32_vgf2p8affineinvqb_v64qi:
5334 case X86::BI__builtin_ia32_vgf2p8affineqb_v16qi:
5335 case X86::BI__builtin_ia32_vgf2p8affineqb_v32qi:
5336 case X86::BI__builtin_ia32_vgf2p8affineqb_v64qi:
5339 case X86::BI__builtin_ia32_vgf2p8mulb_v16qi:
5340 case X86::BI__builtin_ia32_vgf2p8mulb_v32qi:
5341 case X86::BI__builtin_ia32_vgf2p8mulb_v64qi:
5344 case X86::BI__builtin_ia32_insertps128:
5346 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned Mask) {
5348 if ((Mask & (1 << DstIdx)) != 0) {
5349 return std::pair<unsigned, int>{0, -1};
5353 unsigned SrcElem = (Mask >> 6) & 0x3;
5354 unsigned DstElem = (Mask >> 4) & 0x3;
5355 if (DstIdx == DstElem) {
5357 return std::pair<unsigned, int>{1,
static_cast<int>(SrcElem)};
5360 return std::pair<unsigned, int>{0,
static_cast<int>(DstIdx)};
5363 case X86::BI__builtin_ia32_permvarsi256:
5364 case X86::BI__builtin_ia32_permvarsf256:
5365 case X86::BI__builtin_ia32_permvardf512:
5366 case X86::BI__builtin_ia32_permvardi512:
5367 case X86::BI__builtin_ia32_permvarhi128:
5369 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5370 int Offset = ShuffleMask & 0x7;
5371 return std::pair<unsigned, int>{0, Offset};
5373 case X86::BI__builtin_ia32_permvarqi128:
5374 case X86::BI__builtin_ia32_permvarhi256:
5375 case X86::BI__builtin_ia32_permvarsi512:
5376 case X86::BI__builtin_ia32_permvarsf512:
5378 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5379 int Offset = ShuffleMask & 0xF;
5380 return std::pair<unsigned, int>{0, Offset};
5382 case X86::BI__builtin_ia32_permvardi256:
5383 case X86::BI__builtin_ia32_permvardf256:
5385 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5386 int Offset = ShuffleMask & 0x3;
5387 return std::pair<unsigned, int>{0, Offset};
5389 case X86::BI__builtin_ia32_permvarqi256:
5390 case X86::BI__builtin_ia32_permvarhi512:
5392 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5393 int Offset = ShuffleMask & 0x1F;
5394 return std::pair<unsigned, int>{0, Offset};
5396 case X86::BI__builtin_ia32_permvarqi512:
5398 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5399 int Offset = ShuffleMask & 0x3F;
5400 return std::pair<unsigned, int>{0, Offset};
5402 case X86::BI__builtin_ia32_vpermi2varq128:
5403 case X86::BI__builtin_ia32_vpermi2varpd128:
5405 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5406 int Offset = ShuffleMask & 0x1;
5407 unsigned SrcIdx = (ShuffleMask >> 1) & 0x1;
5408 return std::pair<unsigned, int>{SrcIdx, Offset};
5410 case X86::BI__builtin_ia32_vpermi2vard128:
5411 case X86::BI__builtin_ia32_vpermi2varps128:
5412 case X86::BI__builtin_ia32_vpermi2varq256:
5413 case X86::BI__builtin_ia32_vpermi2varpd256:
5415 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5416 int Offset = ShuffleMask & 0x3;
5417 unsigned SrcIdx = (ShuffleMask >> 2) & 0x1;
5418 return std::pair<unsigned, int>{SrcIdx, Offset};
5420 case X86::BI__builtin_ia32_vpermi2varhi128:
5421 case X86::BI__builtin_ia32_vpermi2vard256:
5422 case X86::BI__builtin_ia32_vpermi2varps256:
5423 case X86::BI__builtin_ia32_vpermi2varq512:
5424 case X86::BI__builtin_ia32_vpermi2varpd512:
5426 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5427 int Offset = ShuffleMask & 0x7;
5428 unsigned SrcIdx = (ShuffleMask >> 3) & 0x1;
5429 return std::pair<unsigned, int>{SrcIdx, Offset};
5431 case X86::BI__builtin_ia32_vpermi2varqi128:
5432 case X86::BI__builtin_ia32_vpermi2varhi256:
5433 case X86::BI__builtin_ia32_vpermi2vard512:
5434 case X86::BI__builtin_ia32_vpermi2varps512:
5436 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5437 int Offset = ShuffleMask & 0xF;
5438 unsigned SrcIdx = (ShuffleMask >> 4) & 0x1;
5439 return std::pair<unsigned, int>{SrcIdx, Offset};
5441 case X86::BI__builtin_ia32_vpermi2varqi256:
5442 case X86::BI__builtin_ia32_vpermi2varhi512:
5444 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5445 int Offset = ShuffleMask & 0x1F;
5446 unsigned SrcIdx = (ShuffleMask >> 5) & 0x1;
5447 return std::pair<unsigned, int>{SrcIdx, Offset};
5449 case X86::BI__builtin_ia32_vpermi2varqi512:
5451 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5452 int Offset = ShuffleMask & 0x3F;
5453 unsigned SrcIdx = (ShuffleMask >> 6) & 0x1;
5454 return std::pair<unsigned, int>{SrcIdx, Offset};
5456 case X86::BI__builtin_ia32_vperm2f128_pd256:
5457 case X86::BI__builtin_ia32_vperm2f128_ps256:
5458 case X86::BI__builtin_ia32_vperm2f128_si256:
5459 case X86::BI__builtin_ia32_permti256: {
5460 unsigned NumElements =
5461 Call->getArg(0)->getType()->castAs<
VectorType>()->getNumElements();
5462 unsigned PreservedBitsCnt = NumElements >> 2;
5465 [PreservedBitsCnt](
unsigned DstIdx,
unsigned ShuffleMask) {
5466 unsigned ControlBitsCnt = DstIdx >> PreservedBitsCnt << 2;
5467 unsigned ControlBits = ShuffleMask >> ControlBitsCnt;
5469 if (ControlBits & 0b1000)
5470 return std::make_pair(0u, -1);
5472 unsigned SrcVecIdx = (ControlBits & 0b10) >> 1;
5473 unsigned PreservedBitsMask = (1 << PreservedBitsCnt) - 1;
5474 int SrcIdx = ((ControlBits & 0b1) << PreservedBitsCnt) |
5475 (DstIdx & PreservedBitsMask);
5476 return std::make_pair(SrcVecIdx, SrcIdx);
5479 case X86::BI__builtin_ia32_pshufb128:
5480 case X86::BI__builtin_ia32_pshufb256:
5481 case X86::BI__builtin_ia32_pshufb512:
5483 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5484 uint8_t Ctlb =
static_cast<uint8_t
>(ShuffleMask);
5486 return std::make_pair(0, -1);
5488 unsigned LaneBase = (DstIdx / 16) * 16;
5489 unsigned SrcOffset = Ctlb & 0x0F;
5490 unsigned SrcIdx = LaneBase + SrcOffset;
5491 return std::make_pair(0,
static_cast<int>(SrcIdx));
5494 case X86::BI__builtin_ia32_pshuflw:
5495 case X86::BI__builtin_ia32_pshuflw256:
5496 case X86::BI__builtin_ia32_pshuflw512:
5498 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5499 unsigned LaneBase = (DstIdx / 8) * 8;
5500 unsigned LaneIdx = DstIdx % 8;
5502 unsigned Sel = (ShuffleMask >> (2 * LaneIdx)) & 0x3;
5503 return std::make_pair(0,
static_cast<int>(LaneBase + Sel));
5506 return std::make_pair(0,
static_cast<int>(DstIdx));
5509 case X86::BI__builtin_ia32_pshufhw:
5510 case X86::BI__builtin_ia32_pshufhw256:
5511 case X86::BI__builtin_ia32_pshufhw512:
5513 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5514 unsigned LaneBase = (DstIdx / 8) * 8;
5515 unsigned LaneIdx = DstIdx % 8;
5517 unsigned Sel = (ShuffleMask >> (2 * (LaneIdx - 4))) & 0x3;
5518 return std::make_pair(0,
static_cast<int>(LaneBase + 4 + Sel));
5521 return std::make_pair(0,
static_cast<int>(DstIdx));
5524 case X86::BI__builtin_ia32_pshufd:
5525 case X86::BI__builtin_ia32_pshufd256:
5526 case X86::BI__builtin_ia32_pshufd512:
5527 case X86::BI__builtin_ia32_vpermilps:
5528 case X86::BI__builtin_ia32_vpermilps256:
5529 case X86::BI__builtin_ia32_vpermilps512:
5531 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5532 unsigned LaneBase = (DstIdx / 4) * 4;
5533 unsigned LaneIdx = DstIdx % 4;
5534 unsigned Sel = (ShuffleMask >> (2 * LaneIdx)) & 0x3;
5535 return std::make_pair(0,
static_cast<int>(LaneBase + Sel));
5538 case X86::BI__builtin_ia32_vpermilvarpd:
5539 case X86::BI__builtin_ia32_vpermilvarpd256:
5540 case X86::BI__builtin_ia32_vpermilvarpd512:
5542 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5543 unsigned NumElemPerLane = 2;
5544 unsigned Lane = DstIdx / NumElemPerLane;
5545 unsigned Offset = ShuffleMask & 0b10 ? 1 : 0;
5546 return std::make_pair(
5547 0,
static_cast<int>(Lane * NumElemPerLane + Offset));
5550 case X86::BI__builtin_ia32_vpermilvarps:
5551 case X86::BI__builtin_ia32_vpermilvarps256:
5552 case X86::BI__builtin_ia32_vpermilvarps512:
5554 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5555 unsigned NumElemPerLane = 4;
5556 unsigned Lane = DstIdx / NumElemPerLane;
5557 unsigned Offset = ShuffleMask & 0b11;
5558 return std::make_pair(
5559 0,
static_cast<int>(Lane * NumElemPerLane + Offset));
5562 case X86::BI__builtin_ia32_vpermilpd:
5563 case X86::BI__builtin_ia32_vpermilpd256:
5564 case X86::BI__builtin_ia32_vpermilpd512:
5566 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned Control) {
5567 unsigned NumElemPerLane = 2;
5568 unsigned BitsPerElem = 1;
5569 unsigned MaskBits = 8;
5570 unsigned IndexMask = 0x1;
5571 unsigned Lane = DstIdx / NumElemPerLane;
5572 unsigned LaneOffset = Lane * NumElemPerLane;
5573 unsigned BitIndex = (DstIdx * BitsPerElem) % MaskBits;
5574 unsigned Index = (Control >> BitIndex) & IndexMask;
5575 return std::make_pair(0,
static_cast<int>(LaneOffset + Index));
5578 case X86::BI__builtin_ia32_permdf256:
5579 case X86::BI__builtin_ia32_permdi256:
5581 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned Control) {
5584 unsigned Index = (Control >> (2 * DstIdx)) & 0x3;
5585 return std::make_pair(0,
static_cast<int>(Index));
5588 case X86::BI__builtin_ia32_vpmultishiftqb128:
5589 case X86::BI__builtin_ia32_vpmultishiftqb256:
5590 case X86::BI__builtin_ia32_vpmultishiftqb512:
5592 case X86::BI__builtin_ia32_kandqi:
5593 case X86::BI__builtin_ia32_kandhi:
5594 case X86::BI__builtin_ia32_kandsi:
5595 case X86::BI__builtin_ia32_kanddi:
5598 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS & RHS; });
5600 case X86::BI__builtin_ia32_kandnqi:
5601 case X86::BI__builtin_ia32_kandnhi:
5602 case X86::BI__builtin_ia32_kandnsi:
5603 case X86::BI__builtin_ia32_kandndi:
5606 [](
const APSInt &LHS,
const APSInt &RHS) {
return ~LHS & RHS; });
5608 case X86::BI__builtin_ia32_korqi:
5609 case X86::BI__builtin_ia32_korhi:
5610 case X86::BI__builtin_ia32_korsi:
5611 case X86::BI__builtin_ia32_kordi:
5614 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS | RHS; });
5616 case X86::BI__builtin_ia32_kxnorqi:
5617 case X86::BI__builtin_ia32_kxnorhi:
5618 case X86::BI__builtin_ia32_kxnorsi:
5619 case X86::BI__builtin_ia32_kxnordi:
5622 [](
const APSInt &LHS,
const APSInt &RHS) {
return ~(LHS ^ RHS); });
5624 case X86::BI__builtin_ia32_kxorqi:
5625 case X86::BI__builtin_ia32_kxorhi:
5626 case X86::BI__builtin_ia32_kxorsi:
5627 case X86::BI__builtin_ia32_kxordi:
5630 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS ^ RHS; });
5632 case X86::BI__builtin_ia32_knotqi:
5633 case X86::BI__builtin_ia32_knothi:
5634 case X86::BI__builtin_ia32_knotsi:
5635 case X86::BI__builtin_ia32_knotdi:
5637 S, OpPC,
Call, [](
const APSInt &Src) {
return ~Src; });
5639 case X86::BI__builtin_ia32_kaddqi:
5640 case X86::BI__builtin_ia32_kaddhi:
5641 case X86::BI__builtin_ia32_kaddsi:
5642 case X86::BI__builtin_ia32_kadddi:
5645 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS + RHS; });
5647 case X86::BI__builtin_ia32_kmovb:
5648 case X86::BI__builtin_ia32_kmovw:
5649 case X86::BI__builtin_ia32_kmovd:
5650 case X86::BI__builtin_ia32_kmovq:
5652 S, OpPC,
Call, [](
const APSInt &Src) {
return Src; });
5654 case X86::BI__builtin_ia32_kunpckhi:
5655 case X86::BI__builtin_ia32_kunpckdi:
5656 case X86::BI__builtin_ia32_kunpcksi:
5661 unsigned BW = A.getBitWidth();
5662 return APSInt(A.trunc(BW / 2).concat(B.trunc(BW / 2)),
5666 case X86::BI__builtin_ia32_phminposuw128:
5669 case X86::BI__builtin_ia32_psraq128:
5670 case X86::BI__builtin_ia32_psraq256:
5671 case X86::BI__builtin_ia32_psraq512:
5672 case X86::BI__builtin_ia32_psrad128:
5673 case X86::BI__builtin_ia32_psrad256:
5674 case X86::BI__builtin_ia32_psrad512:
5675 case X86::BI__builtin_ia32_psraw128:
5676 case X86::BI__builtin_ia32_psraw256:
5677 case X86::BI__builtin_ia32_psraw512:
5680 [](
const APInt &Elt, uint64_t Count) {
return Elt.ashr(Count); },
5681 [](
const APInt &Elt,
unsigned Width) {
return Elt.ashr(Width - 1); });
5683 case X86::BI__builtin_ia32_psllq128:
5684 case X86::BI__builtin_ia32_psllq256:
5685 case X86::BI__builtin_ia32_psllq512:
5686 case X86::BI__builtin_ia32_pslld128:
5687 case X86::BI__builtin_ia32_pslld256:
5688 case X86::BI__builtin_ia32_pslld512:
5689 case X86::BI__builtin_ia32_psllw128:
5690 case X86::BI__builtin_ia32_psllw256:
5691 case X86::BI__builtin_ia32_psllw512:
5694 [](
const APInt &Elt, uint64_t Count) {
return Elt.shl(Count); },
5695 [](
const APInt &Elt,
unsigned Width) {
return APInt::getZero(Width); });
5697 case X86::BI__builtin_ia32_psrlq128:
5698 case X86::BI__builtin_ia32_psrlq256:
5699 case X86::BI__builtin_ia32_psrlq512:
5700 case X86::BI__builtin_ia32_psrld128:
5701 case X86::BI__builtin_ia32_psrld256:
5702 case X86::BI__builtin_ia32_psrld512:
5703 case X86::BI__builtin_ia32_psrlw128:
5704 case X86::BI__builtin_ia32_psrlw256:
5705 case X86::BI__builtin_ia32_psrlw512:
5708 [](
const APInt &Elt, uint64_t Count) {
return Elt.lshr(Count); },
5709 [](
const APInt &Elt,
unsigned Width) {
return APInt::getZero(Width); });
5711 case X86::BI__builtin_ia32_pternlogd128_mask:
5712 case X86::BI__builtin_ia32_pternlogd256_mask:
5713 case X86::BI__builtin_ia32_pternlogd512_mask:
5714 case X86::BI__builtin_ia32_pternlogq128_mask:
5715 case X86::BI__builtin_ia32_pternlogq256_mask:
5716 case X86::BI__builtin_ia32_pternlogq512_mask:
5718 case X86::BI__builtin_ia32_pternlogd128_maskz:
5719 case X86::BI__builtin_ia32_pternlogd256_maskz:
5720 case X86::BI__builtin_ia32_pternlogd512_maskz:
5721 case X86::BI__builtin_ia32_pternlogq128_maskz:
5722 case X86::BI__builtin_ia32_pternlogq256_maskz:
5723 case X86::BI__builtin_ia32_pternlogq512_maskz:
5725 case Builtin::BI__builtin_elementwise_fshl:
5727 llvm::APIntOps::fshl);
5728 case Builtin::BI__builtin_elementwise_fshr:
5730 llvm::APIntOps::fshr);
5732 case X86::BI__builtin_ia32_shuf_f32x4_256:
5733 case X86::BI__builtin_ia32_shuf_i32x4_256:
5734 case X86::BI__builtin_ia32_shuf_f64x2_256:
5735 case X86::BI__builtin_ia32_shuf_i64x2_256:
5736 case X86::BI__builtin_ia32_shuf_f32x4:
5737 case X86::BI__builtin_ia32_shuf_i32x4:
5738 case X86::BI__builtin_ia32_shuf_f64x2:
5739 case X86::BI__builtin_ia32_shuf_i64x2: {
5745 unsigned LaneBits = 128u;
5746 unsigned NumLanes = (NumElems * ElemBits) / LaneBits;
5747 unsigned NumElemsPerLane = LaneBits / ElemBits;
5751 [NumLanes, NumElemsPerLane](
unsigned DstIdx,
unsigned ShuffleMask) {
5753 unsigned BitsPerElem = NumLanes / 2;
5754 unsigned IndexMask = (1u << BitsPerElem) - 1;
5755 unsigned Lane = DstIdx / NumElemsPerLane;
5756 unsigned SrcIdx = (Lane < NumLanes / 2) ? 0 : 1;
5757 unsigned BitIdx = BitsPerElem * Lane;
5758 unsigned SrcLaneIdx = (ShuffleMask >> BitIdx) & IndexMask;
5759 unsigned ElemInLane = DstIdx % NumElemsPerLane;
5760 unsigned IdxToPick = SrcLaneIdx * NumElemsPerLane + ElemInLane;
5761 return std::pair<unsigned, int>{SrcIdx, IdxToPick};
5765 case X86::BI__builtin_ia32_insertf32x4_256:
5766 case X86::BI__builtin_ia32_inserti32x4_256:
5767 case X86::BI__builtin_ia32_insertf64x2_256:
5768 case X86::BI__builtin_ia32_inserti64x2_256:
5769 case X86::BI__builtin_ia32_insertf32x4:
5770 case X86::BI__builtin_ia32_inserti32x4:
5771 case X86::BI__builtin_ia32_insertf64x2_512:
5772 case X86::BI__builtin_ia32_inserti64x2_512:
5773 case X86::BI__builtin_ia32_insertf32x8:
5774 case X86::BI__builtin_ia32_inserti32x8:
5775 case X86::BI__builtin_ia32_insertf64x4:
5776 case X86::BI__builtin_ia32_inserti64x4:
5777 case X86::BI__builtin_ia32_vinsertf128_ps256:
5778 case X86::BI__builtin_ia32_vinsertf128_pd256:
5779 case X86::BI__builtin_ia32_vinsertf128_si256:
5780 case X86::BI__builtin_ia32_insert128i256:
5783 case clang::X86::BI__builtin_ia32_vcvtps2ph:
5784 case clang::X86::BI__builtin_ia32_vcvtps2ph256:
5787 case X86::BI__builtin_ia32_vec_ext_v4hi:
5788 case X86::BI__builtin_ia32_vec_ext_v16qi:
5789 case X86::BI__builtin_ia32_vec_ext_v8hi:
5790 case X86::BI__builtin_ia32_vec_ext_v4si:
5791 case X86::BI__builtin_ia32_vec_ext_v2di:
5792 case X86::BI__builtin_ia32_vec_ext_v32qi:
5793 case X86::BI__builtin_ia32_vec_ext_v16hi:
5794 case X86::BI__builtin_ia32_vec_ext_v8si:
5795 case X86::BI__builtin_ia32_vec_ext_v4di:
5796 case X86::BI__builtin_ia32_vec_ext_v4sf:
5799 case X86::BI__builtin_ia32_vec_set_v4hi:
5800 case X86::BI__builtin_ia32_vec_set_v16qi:
5801 case X86::BI__builtin_ia32_vec_set_v8hi:
5802 case X86::BI__builtin_ia32_vec_set_v4si:
5803 case X86::BI__builtin_ia32_vec_set_v2di:
5804 case X86::BI__builtin_ia32_vec_set_v32qi:
5805 case X86::BI__builtin_ia32_vec_set_v16hi:
5806 case X86::BI__builtin_ia32_vec_set_v8si:
5807 case X86::BI__builtin_ia32_vec_set_v4di:
5810 case X86::BI__builtin_ia32_cvtb2mask128:
5811 case X86::BI__builtin_ia32_cvtb2mask256:
5812 case X86::BI__builtin_ia32_cvtb2mask512:
5813 case X86::BI__builtin_ia32_cvtw2mask128:
5814 case X86::BI__builtin_ia32_cvtw2mask256:
5815 case X86::BI__builtin_ia32_cvtw2mask512:
5816 case X86::BI__builtin_ia32_cvtd2mask128:
5817 case X86::BI__builtin_ia32_cvtd2mask256:
5818 case X86::BI__builtin_ia32_cvtd2mask512:
5819 case X86::BI__builtin_ia32_cvtq2mask128:
5820 case X86::BI__builtin_ia32_cvtq2mask256:
5821 case X86::BI__builtin_ia32_cvtq2mask512:
5824 case X86::BI__builtin_ia32_cvtmask2b128:
5825 case X86::BI__builtin_ia32_cvtmask2b256:
5826 case X86::BI__builtin_ia32_cvtmask2b512:
5827 case X86::BI__builtin_ia32_cvtmask2w128:
5828 case X86::BI__builtin_ia32_cvtmask2w256:
5829 case X86::BI__builtin_ia32_cvtmask2w512:
5830 case X86::BI__builtin_ia32_cvtmask2d128:
5831 case X86::BI__builtin_ia32_cvtmask2d256:
5832 case X86::BI__builtin_ia32_cvtmask2d512:
5833 case X86::BI__builtin_ia32_cvtmask2q128:
5834 case X86::BI__builtin_ia32_cvtmask2q256:
5835 case X86::BI__builtin_ia32_cvtmask2q512:
5838 case X86::BI__builtin_ia32_cvtsd2ss:
5841 case X86::BI__builtin_ia32_cvtsd2ss_round_mask:
5844 case X86::BI__builtin_ia32_cvtpd2ps:
5845 case X86::BI__builtin_ia32_cvtpd2ps256:
5847 case X86::BI__builtin_ia32_cvtpd2ps_mask:
5849 case X86::BI__builtin_ia32_cvtpd2ps512_mask:
5852 case X86::BI__builtin_ia32_cmpb128_mask:
5853 case X86::BI__builtin_ia32_cmpw128_mask:
5854 case X86::BI__builtin_ia32_cmpd128_mask:
5855 case X86::BI__builtin_ia32_cmpq128_mask:
5856 case X86::BI__builtin_ia32_cmpb256_mask:
5857 case X86::BI__builtin_ia32_cmpw256_mask:
5858 case X86::BI__builtin_ia32_cmpd256_mask:
5859 case X86::BI__builtin_ia32_cmpq256_mask:
5860 case X86::BI__builtin_ia32_cmpb512_mask:
5861 case X86::BI__builtin_ia32_cmpw512_mask:
5862 case X86::BI__builtin_ia32_cmpd512_mask:
5863 case X86::BI__builtin_ia32_cmpq512_mask:
5867 case X86::BI__builtin_ia32_ucmpb128_mask:
5868 case X86::BI__builtin_ia32_ucmpw128_mask:
5869 case X86::BI__builtin_ia32_ucmpd128_mask:
5870 case X86::BI__builtin_ia32_ucmpq128_mask:
5871 case X86::BI__builtin_ia32_ucmpb256_mask:
5872 case X86::BI__builtin_ia32_ucmpw256_mask:
5873 case X86::BI__builtin_ia32_ucmpd256_mask:
5874 case X86::BI__builtin_ia32_ucmpq256_mask:
5875 case X86::BI__builtin_ia32_ucmpb512_mask:
5876 case X86::BI__builtin_ia32_ucmpw512_mask:
5877 case X86::BI__builtin_ia32_ucmpd512_mask:
5878 case X86::BI__builtin_ia32_ucmpq512_mask:
5882 case X86::BI__builtin_ia32_vpshufbitqmb128_mask:
5883 case X86::BI__builtin_ia32_vpshufbitqmb256_mask:
5884 case X86::BI__builtin_ia32_vpshufbitqmb512_mask:
5887 case X86::BI__builtin_ia32_pslldqi128_byteshift:
5888 case X86::BI__builtin_ia32_pslldqi256_byteshift:
5889 case X86::BI__builtin_ia32_pslldqi512_byteshift:
5896 [](
unsigned DstIdx,
unsigned Shift) -> std::pair<unsigned, int> {
5897 unsigned LaneBase = (DstIdx / 16) * 16;
5898 unsigned LaneIdx = DstIdx % 16;
5899 if (LaneIdx < Shift)
5900 return std::make_pair(0, -1);
5902 return std::make_pair(0,
5903 static_cast<int>(LaneBase + LaneIdx - Shift));
5906 case X86::BI__builtin_ia32_psrldqi128_byteshift:
5907 case X86::BI__builtin_ia32_psrldqi256_byteshift:
5908 case X86::BI__builtin_ia32_psrldqi512_byteshift:
5915 [](
unsigned DstIdx,
unsigned Shift) -> std::pair<unsigned, int> {
5916 unsigned LaneBase = (DstIdx / 16) * 16;
5917 unsigned LaneIdx = DstIdx % 16;
5918 if (LaneIdx + Shift < 16)
5919 return std::make_pair(0,
5920 static_cast<int>(LaneBase + LaneIdx + Shift));
5922 return std::make_pair(0, -1);
5925 case X86::BI__builtin_ia32_palignr128:
5926 case X86::BI__builtin_ia32_palignr256:
5927 case X86::BI__builtin_ia32_palignr512:
5929 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned Shift) {
5931 unsigned VecIdx = 1;
5934 int Lane = DstIdx / 16;
5935 int Offset = DstIdx % 16;
5938 unsigned ShiftedIdx = Offset + (Shift & 0xFF);
5939 if (ShiftedIdx < 16) {
5940 ElemIdx = ShiftedIdx + (Lane * 16);
5941 }
else if (ShiftedIdx < 32) {
5943 ElemIdx = (ShiftedIdx - 16) + (Lane * 16);
5946 return std::pair<unsigned, int>{VecIdx, ElemIdx};
5949 case X86::BI__builtin_ia32_alignd128:
5950 case X86::BI__builtin_ia32_alignd256:
5951 case X86::BI__builtin_ia32_alignd512:
5952 case X86::BI__builtin_ia32_alignq128:
5953 case X86::BI__builtin_ia32_alignq256:
5954 case X86::BI__builtin_ia32_alignq512: {
5955 unsigned NumElems =
Call->getType()->castAs<
VectorType>()->getNumElements();
5957 S, OpPC,
Call, [NumElems](
unsigned DstIdx,
unsigned Shift) {
5958 unsigned Imm = Shift & 0xFF;
5959 unsigned EffectiveShift = Imm & (NumElems - 1);
5960 unsigned SourcePos = DstIdx + EffectiveShift;
5961 unsigned VecIdx = SourcePos < NumElems ? 1u : 0u;
5962 unsigned ElemIdx = SourcePos & (NumElems - 1);
5963 return std::pair<unsigned, int>{VecIdx,
static_cast<int>(ElemIdx)};
5967 case clang::X86::BI__builtin_ia32_minps:
5968 case clang::X86::BI__builtin_ia32_minpd:
5969 case clang::X86::BI__builtin_ia32_minph128:
5970 case clang::X86::BI__builtin_ia32_minph256:
5971 case clang::X86::BI__builtin_ia32_minps256:
5972 case clang::X86::BI__builtin_ia32_minpd256:
5973 case clang::X86::BI__builtin_ia32_minps512:
5974 case clang::X86::BI__builtin_ia32_minpd512:
5975 case clang::X86::BI__builtin_ia32_minph512:
5979 std::optional<APSInt>) -> std::optional<APFloat> {
5980 if (A.isNaN() || A.isInfinity() || A.isDenormal() || B.isNaN() ||
5981 B.isInfinity() || B.isDenormal())
5982 return std::nullopt;
5983 if (A.isZero() && B.isZero())
5985 return llvm::minimum(A, B);
5988 case clang::X86::BI__builtin_ia32_minss:
5989 case clang::X86::BI__builtin_ia32_minsd:
5993 std::optional<APSInt> RoundingMode) -> std::optional<APFloat> {
5998 case clang::X86::BI__builtin_ia32_minsd_round_mask:
5999 case clang::X86::BI__builtin_ia32_minss_round_mask:
6000 case clang::X86::BI__builtin_ia32_minsh_round_mask:
6001 case clang::X86::BI__builtin_ia32_maxsd_round_mask:
6002 case clang::X86::BI__builtin_ia32_maxss_round_mask:
6003 case clang::X86::BI__builtin_ia32_maxsh_round_mask: {
6004 bool IsMin = BuiltinID == clang::X86::BI__builtin_ia32_minsd_round_mask ||
6005 BuiltinID == clang::X86::BI__builtin_ia32_minss_round_mask ||
6006 BuiltinID == clang::X86::BI__builtin_ia32_minsh_round_mask;
6010 std::optional<APSInt> RoundingMode) -> std::optional<APFloat> {
6015 case clang::X86::BI__builtin_ia32_maxps:
6016 case clang::X86::BI__builtin_ia32_maxpd:
6017 case clang::X86::BI__builtin_ia32_maxph128:
6018 case clang::X86::BI__builtin_ia32_maxph256:
6019 case clang::X86::BI__builtin_ia32_maxps256:
6020 case clang::X86::BI__builtin_ia32_maxpd256:
6021 case clang::X86::BI__builtin_ia32_maxps512:
6022 case clang::X86::BI__builtin_ia32_maxpd512:
6023 case clang::X86::BI__builtin_ia32_maxph512:
6027 std::optional<APSInt>) -> std::optional<APFloat> {
6028 if (A.isNaN() || A.isInfinity() || A.isDenormal() || B.isNaN() ||
6029 B.isInfinity() || B.isDenormal())
6030 return std::nullopt;
6031 if (A.isZero() && B.isZero())
6033 return llvm::maximum(A, B);
6036 case clang::X86::BI__builtin_ia32_maxss:
6037 case clang::X86::BI__builtin_ia32_maxsd:
6041 std::optional<APSInt> RoundingMode) -> std::optional<APFloat> {
6048 diag::note_invalid_subexpr_in_const_expr)
6054 llvm_unreachable(
"Unhandled builtin ID");