4193 uint32_t BuiltinID) {
4198 switch (BuiltinID) {
4199 case Builtin::BI__builtin_is_constant_evaluated:
4202 case Builtin::BI__builtin_assume:
4203 case Builtin::BI__assume:
4206 case Builtin::BI__builtin_strcmp:
4207 case Builtin::BIstrcmp:
4208 case Builtin::BI__builtin_strncmp:
4209 case Builtin::BIstrncmp:
4210 case Builtin::BI__builtin_wcsncmp:
4211 case Builtin::BIwcsncmp:
4212 case Builtin::BI__builtin_wcscmp:
4213 case Builtin::BIwcscmp:
4216 case Builtin::BI__builtin_strlen:
4217 case Builtin::BIstrlen:
4218 case Builtin::BI__builtin_wcslen:
4219 case Builtin::BIwcslen:
4222 case Builtin::BI__builtin_nan:
4223 case Builtin::BI__builtin_nanf:
4224 case Builtin::BI__builtin_nanl:
4225 case Builtin::BI__builtin_nanf16:
4226 case Builtin::BI__builtin_nanf128:
4229 case Builtin::BI__builtin_nans:
4230 case Builtin::BI__builtin_nansf:
4231 case Builtin::BI__builtin_nansl:
4232 case Builtin::BI__builtin_nansf16:
4233 case Builtin::BI__builtin_nansf128:
4236 case Builtin::BI__builtin_huge_val:
4237 case Builtin::BI__builtin_huge_valf:
4238 case Builtin::BI__builtin_huge_vall:
4239 case Builtin::BI__builtin_huge_valf16:
4240 case Builtin::BI__builtin_huge_valf128:
4241 case Builtin::BI__builtin_inf:
4242 case Builtin::BI__builtin_inff:
4243 case Builtin::BI__builtin_infl:
4244 case Builtin::BI__builtin_inff16:
4245 case Builtin::BI__builtin_inff128:
4248 case Builtin::BI__builtin_copysign:
4249 case Builtin::BI__builtin_copysignf:
4250 case Builtin::BI__builtin_copysignl:
4251 case Builtin::BI__builtin_copysignf128:
4254 case Builtin::BI__builtin_fmin:
4255 case Builtin::BI__builtin_fminf:
4256 case Builtin::BI__builtin_fminl:
4257 case Builtin::BI__builtin_fminf16:
4258 case Builtin::BI__builtin_fminf128:
4261 case Builtin::BI__builtin_fminimum_num:
4262 case Builtin::BI__builtin_fminimum_numf:
4263 case Builtin::BI__builtin_fminimum_numl:
4264 case Builtin::BI__builtin_fminimum_numf16:
4265 case Builtin::BI__builtin_fminimum_numf128:
4268 case Builtin::BI__builtin_fmax:
4269 case Builtin::BI__builtin_fmaxf:
4270 case Builtin::BI__builtin_fmaxl:
4271 case Builtin::BI__builtin_fmaxf16:
4272 case Builtin::BI__builtin_fmaxf128:
4275 case Builtin::BI__builtin_fmaximum_num:
4276 case Builtin::BI__builtin_fmaximum_numf:
4277 case Builtin::BI__builtin_fmaximum_numl:
4278 case Builtin::BI__builtin_fmaximum_numf16:
4279 case Builtin::BI__builtin_fmaximum_numf128:
4282 case Builtin::BI__builtin_isnan:
4285 case Builtin::BI__builtin_issignaling:
4288 case Builtin::BI__builtin_isinf:
4291 case Builtin::BI__builtin_isinf_sign:
4294 case Builtin::BI__builtin_isfinite:
4297 case Builtin::BI__builtin_isnormal:
4300 case Builtin::BI__builtin_issubnormal:
4303 case Builtin::BI__builtin_iszero:
4306 case Builtin::BI__builtin_signbit:
4307 case Builtin::BI__builtin_signbitf:
4308 case Builtin::BI__builtin_signbitl:
4311 case Builtin::BI__builtin_isgreater:
4312 case Builtin::BI__builtin_isgreaterequal:
4313 case Builtin::BI__builtin_isless:
4314 case Builtin::BI__builtin_islessequal:
4315 case Builtin::BI__builtin_islessgreater:
4316 case Builtin::BI__builtin_isunordered:
4319 case Builtin::BI__builtin_isfpclass:
4322 case Builtin::BI__builtin_fpclassify:
4325 case Builtin::BI__builtin_fabs:
4326 case Builtin::BI__builtin_fabsf:
4327 case Builtin::BI__builtin_fabsl:
4328 case Builtin::BI__builtin_fabsf128:
4331 case Builtin::BI__builtin_abs:
4332 case Builtin::BI__builtin_labs:
4333 case Builtin::BI__builtin_llabs:
4336 case Builtin::BI__builtin_popcount:
4337 case Builtin::BI__builtin_popcountl:
4338 case Builtin::BI__builtin_popcountll:
4339 case Builtin::BI__builtin_popcountg:
4340 case Builtin::BI__popcnt16:
4341 case Builtin::BI__popcnt:
4342 case Builtin::BI__popcnt64:
4345 case Builtin::BI__builtin_parity:
4346 case Builtin::BI__builtin_parityl:
4347 case Builtin::BI__builtin_parityll:
4350 return APInt(Val.getBitWidth(), Val.popcount() % 2);
4352 case Builtin::BI__builtin_clrsb:
4353 case Builtin::BI__builtin_clrsbl:
4354 case Builtin::BI__builtin_clrsbll:
4357 return APInt(Val.getBitWidth(),
4358 Val.getBitWidth() - Val.getSignificantBits());
4360 case Builtin::BI__builtin_bitreverseg:
4361 case Builtin::BI__builtin_bitreverse8:
4362 case Builtin::BI__builtin_bitreverse16:
4363 case Builtin::BI__builtin_bitreverse32:
4364 case Builtin::BI__builtin_bitreverse64:
4366 S, OpPC,
Call, [](
const APSInt &Val) {
return Val.reverseBits(); });
4368 case Builtin::BI__builtin_classify_type:
4371 case Builtin::BI__builtin_expect:
4372 case Builtin::BI__builtin_expect_with_probability:
4375 case Builtin::BI__builtin_rotateleft8:
4376 case Builtin::BI__builtin_rotateleft16:
4377 case Builtin::BI__builtin_rotateleft32:
4378 case Builtin::BI__builtin_rotateleft64:
4379 case Builtin::BI__builtin_stdc_rotate_left:
4380 case Builtin::BI_rotl8:
4381 case Builtin::BI_rotl16:
4382 case Builtin::BI_rotl:
4383 case Builtin::BI_lrotl:
4384 case Builtin::BI_rotl64:
4385 case Builtin::BI__builtin_rotateright8:
4386 case Builtin::BI__builtin_rotateright16:
4387 case Builtin::BI__builtin_rotateright32:
4388 case Builtin::BI__builtin_rotateright64:
4389 case Builtin::BI__builtin_stdc_rotate_right:
4390 case Builtin::BI_rotr8:
4391 case Builtin::BI_rotr16:
4392 case Builtin::BI_rotr:
4393 case Builtin::BI_lrotr:
4394 case Builtin::BI_rotr64: {
4397 switch (BuiltinID) {
4398 case Builtin::BI__builtin_rotateright8:
4399 case Builtin::BI__builtin_rotateright16:
4400 case Builtin::BI__builtin_rotateright32:
4401 case Builtin::BI__builtin_rotateright64:
4402 case Builtin::BI__builtin_stdc_rotate_right:
4403 case Builtin::BI_rotr8:
4404 case Builtin::BI_rotr16:
4405 case Builtin::BI_rotr:
4406 case Builtin::BI_lrotr:
4407 case Builtin::BI_rotr64:
4408 IsRotateRight =
true;
4411 IsRotateRight =
false;
4418 return IsRotateRight ?
Value.rotr(Amount.getZExtValue())
4419 :
Value.rotl(Amount.getZExtValue());
4423 case Builtin::BI__builtin_ffs:
4424 case Builtin::BI__builtin_ffsl:
4425 case Builtin::BI__builtin_ffsll:
4428 return APInt(Val.getBitWidth(),
4429 Val.isZero() ? 0u : Val.countTrailingZeros() + 1u);
4432 case Builtin::BIaddressof:
4433 case Builtin::BI__addressof:
4434 case Builtin::BI__builtin_addressof:
4438 case Builtin::BIas_const:
4439 case Builtin::BIforward:
4440 case Builtin::BIforward_like:
4441 case Builtin::BImove:
4442 case Builtin::BImove_if_noexcept:
4446 case Builtin::BI__builtin_eh_return_data_regno:
4449 case Builtin::BI__builtin_launder:
4453 case Builtin::BI__builtin_add_overflow:
4454 case Builtin::BI__builtin_sub_overflow:
4455 case Builtin::BI__builtin_mul_overflow:
4456 case Builtin::BI__builtin_sadd_overflow:
4457 case Builtin::BI__builtin_uadd_overflow:
4458 case Builtin::BI__builtin_uaddl_overflow:
4459 case Builtin::BI__builtin_uaddll_overflow:
4460 case Builtin::BI__builtin_usub_overflow:
4461 case Builtin::BI__builtin_usubl_overflow:
4462 case Builtin::BI__builtin_usubll_overflow:
4463 case Builtin::BI__builtin_umul_overflow:
4464 case Builtin::BI__builtin_umull_overflow:
4465 case Builtin::BI__builtin_umulll_overflow:
4466 case Builtin::BI__builtin_saddl_overflow:
4467 case Builtin::BI__builtin_saddll_overflow:
4468 case Builtin::BI__builtin_ssub_overflow:
4469 case Builtin::BI__builtin_ssubl_overflow:
4470 case Builtin::BI__builtin_ssubll_overflow:
4471 case Builtin::BI__builtin_smul_overflow:
4472 case Builtin::BI__builtin_smull_overflow:
4473 case Builtin::BI__builtin_smulll_overflow:
4476 case Builtin::BI__builtin_addcb:
4477 case Builtin::BI__builtin_addcs:
4478 case Builtin::BI__builtin_addc:
4479 case Builtin::BI__builtin_addcl:
4480 case Builtin::BI__builtin_addcll:
4481 case Builtin::BI__builtin_subcb:
4482 case Builtin::BI__builtin_subcs:
4483 case Builtin::BI__builtin_subc:
4484 case Builtin::BI__builtin_subcl:
4485 case Builtin::BI__builtin_subcll:
4488 case Builtin::BI__builtin_clz:
4489 case Builtin::BI__builtin_clzl:
4490 case Builtin::BI__builtin_clzll:
4491 case Builtin::BI__builtin_clzs:
4492 case Builtin::BI__builtin_clzg:
4493 case Builtin::BI__lzcnt16:
4494 case Builtin::BI__lzcnt:
4495 case Builtin::BI__lzcnt64:
4498 case Builtin::BI__builtin_ctz:
4499 case Builtin::BI__builtin_ctzl:
4500 case Builtin::BI__builtin_ctzll:
4501 case Builtin::BI__builtin_ctzs:
4502 case Builtin::BI__builtin_ctzg:
4505 case Builtin::BI__builtin_elementwise_clzg:
4506 case Builtin::BI__builtin_elementwise_ctzg:
4509 case Builtin::BI__builtin_bswapg:
4510 case Builtin::BI__builtin_bswap16:
4511 case Builtin::BI__builtin_bswap32:
4512 case Builtin::BI__builtin_bswap64:
4515 case Builtin::BI__atomic_always_lock_free:
4516 case Builtin::BI__atomic_is_lock_free:
4519 case Builtin::BI__c11_atomic_is_lock_free:
4522 case Builtin::BI__builtin_complex:
4525 case Builtin::BI__builtin_is_aligned:
4526 case Builtin::BI__builtin_align_up:
4527 case Builtin::BI__builtin_align_down:
4530 case Builtin::BI__builtin_assume_aligned:
4533 case clang::X86::BI__builtin_ia32_crc32qi:
4535 case clang::X86::BI__builtin_ia32_crc32hi:
4537 case clang::X86::BI__builtin_ia32_crc32si:
4539 case clang::X86::BI__builtin_ia32_crc32di:
4542 case clang::X86::BI__builtin_ia32_bextr_u32:
4543 case clang::X86::BI__builtin_ia32_bextr_u64:
4544 case clang::X86::BI__builtin_ia32_bextri_u32:
4545 case clang::X86::BI__builtin_ia32_bextri_u64:
4548 unsigned BitWidth = Val.getBitWidth();
4549 uint64_t Shift = Idx.extractBitsAsZExtValue(8, 0);
4550 uint64_t Length = Idx.extractBitsAsZExtValue(8, 8);
4551 if (Length > BitWidth) {
4556 if (Length == 0 || Shift >= BitWidth)
4557 return APInt(BitWidth, 0);
4559 uint64_t
Result = Val.getZExtValue() >> Shift;
4560 Result &= llvm::maskTrailingOnes<uint64_t>(Length);
4564 case clang::X86::BI__builtin_ia32_bzhi_si:
4565 case clang::X86::BI__builtin_ia32_bzhi_di:
4568 unsigned BitWidth = Val.getBitWidth();
4569 uint64_t Index = Idx.extractBitsAsZExtValue(8, 0);
4572 if (Index < BitWidth)
4573 Result.clearHighBits(BitWidth - Index);
4578 case clang::X86::BI__builtin_ia32_ktestcqi:
4579 case clang::X86::BI__builtin_ia32_ktestchi:
4580 case clang::X86::BI__builtin_ia32_ktestcsi:
4581 case clang::X86::BI__builtin_ia32_ktestcdi:
4584 return APInt(
sizeof(
unsigned char) * 8, (~A & B) == 0);
4587 case clang::X86::BI__builtin_ia32_ktestzqi:
4588 case clang::X86::BI__builtin_ia32_ktestzhi:
4589 case clang::X86::BI__builtin_ia32_ktestzsi:
4590 case clang::X86::BI__builtin_ia32_ktestzdi:
4593 return APInt(
sizeof(
unsigned char) * 8, (A & B) == 0);
4596 case clang::X86::BI__builtin_ia32_kortestcqi:
4597 case clang::X86::BI__builtin_ia32_kortestchi:
4598 case clang::X86::BI__builtin_ia32_kortestcsi:
4599 case clang::X86::BI__builtin_ia32_kortestcdi:
4602 return APInt(
sizeof(
unsigned char) * 8, ~(A | B) == 0);
4605 case clang::X86::BI__builtin_ia32_kortestzqi:
4606 case clang::X86::BI__builtin_ia32_kortestzhi:
4607 case clang::X86::BI__builtin_ia32_kortestzsi:
4608 case clang::X86::BI__builtin_ia32_kortestzdi:
4611 return APInt(
sizeof(
unsigned char) * 8, (A | B) == 0);
4614 case clang::X86::BI__builtin_ia32_kshiftliqi:
4615 case clang::X86::BI__builtin_ia32_kshiftlihi:
4616 case clang::X86::BI__builtin_ia32_kshiftlisi:
4617 case clang::X86::BI__builtin_ia32_kshiftlidi:
4620 unsigned Amt = RHS.getZExtValue() & 0xFF;
4621 if (Amt >= LHS.getBitWidth())
4622 return APInt::getZero(LHS.getBitWidth());
4623 return LHS.shl(Amt);
4626 case clang::X86::BI__builtin_ia32_kshiftriqi:
4627 case clang::X86::BI__builtin_ia32_kshiftrihi:
4628 case clang::X86::BI__builtin_ia32_kshiftrisi:
4629 case clang::X86::BI__builtin_ia32_kshiftridi:
4632 unsigned Amt = RHS.getZExtValue() & 0xFF;
4633 if (Amt >= LHS.getBitWidth())
4634 return APInt::getZero(LHS.getBitWidth());
4635 return LHS.lshr(Amt);
4638 case clang::X86::BI__builtin_ia32_lzcnt_u16:
4639 case clang::X86::BI__builtin_ia32_lzcnt_u32:
4640 case clang::X86::BI__builtin_ia32_lzcnt_u64:
4643 return APInt(Src.getBitWidth(), Src.countLeadingZeros());
4646 case clang::X86::BI__builtin_ia32_tzcnt_u16:
4647 case clang::X86::BI__builtin_ia32_tzcnt_u32:
4648 case clang::X86::BI__builtin_ia32_tzcnt_u64:
4651 return APInt(Src.getBitWidth(), Src.countTrailingZeros());
4654 case clang::X86::BI__builtin_ia32_pdep_si:
4655 case clang::X86::BI__builtin_ia32_pdep_di:
4658 unsigned BitWidth = Val.getBitWidth();
4661 for (
unsigned I = 0, P = 0; I != BitWidth; ++I) {
4663 Result.setBitVal(I, Val[P++]);
4669 case clang::X86::BI__builtin_ia32_pext_si:
4670 case clang::X86::BI__builtin_ia32_pext_di:
4673 unsigned BitWidth = Val.getBitWidth();
4676 for (
unsigned I = 0, P = 0; I != BitWidth; ++I) {
4678 Result.setBitVal(P++, Val[I]);
4684 case clang::X86::BI__builtin_ia32_addcarryx_u32:
4685 case clang::X86::BI__builtin_ia32_addcarryx_u64:
4686 case clang::X86::BI__builtin_ia32_subborrow_u32:
4687 case clang::X86::BI__builtin_ia32_subborrow_u64:
4691 case Builtin::BI__builtin_os_log_format_buffer_size:
4694 case Builtin::BI__builtin_ptrauth_string_discriminator:
4697 case Builtin::BI__builtin_infer_alloc_token:
4700 case Builtin::BI__noop:
4704 case Builtin::BI__builtin_operator_new:
4707 case Builtin::BI__builtin_operator_delete:
4710 case Builtin::BI__arithmetic_fence:
4713 case Builtin::BI__builtin_reduce_add:
4714 case Builtin::BI__builtin_reduce_mul:
4715 case Builtin::BI__builtin_reduce_and:
4716 case Builtin::BI__builtin_reduce_or:
4717 case Builtin::BI__builtin_reduce_xor:
4718 case Builtin::BI__builtin_reduce_min:
4719 case Builtin::BI__builtin_reduce_max:
4722 case Builtin::BI__builtin_elementwise_popcount:
4725 return APInt(Src.getBitWidth(), Src.popcount());
4727 case Builtin::BI__builtin_elementwise_bitreverse:
4729 S, OpPC,
Call, [](
const APSInt &Src) {
return Src.reverseBits(); });
4731 case Builtin::BI__builtin_elementwise_abs:
4734 case Builtin::BI__builtin_memcpy:
4735 case Builtin::BImemcpy:
4736 case Builtin::BI__builtin_wmemcpy:
4737 case Builtin::BIwmemcpy:
4738 case Builtin::BI__builtin_memmove:
4739 case Builtin::BImemmove:
4740 case Builtin::BI__builtin_wmemmove:
4741 case Builtin::BIwmemmove:
4744 case Builtin::BI__builtin_memcmp:
4745 case Builtin::BImemcmp:
4746 case Builtin::BI__builtin_bcmp:
4747 case Builtin::BIbcmp:
4748 case Builtin::BI__builtin_wmemcmp:
4749 case Builtin::BIwmemcmp:
4752 case Builtin::BImemchr:
4753 case Builtin::BI__builtin_memchr:
4754 case Builtin::BIstrchr:
4755 case Builtin::BI__builtin_strchr:
4756 case Builtin::BIwmemchr:
4757 case Builtin::BI__builtin_wmemchr:
4758 case Builtin::BIwcschr:
4759 case Builtin::BI__builtin_wcschr:
4760 case Builtin::BI__builtin_char_memchr:
4763 case Builtin::BI__builtin_object_size:
4764 case Builtin::BI__builtin_dynamic_object_size:
4767 case Builtin::BI__builtin_is_within_lifetime:
4770 case Builtin::BI__builtin_elementwise_add_sat:
4773 return LHS.isSigned() ? LHS.sadd_sat(RHS) : LHS.uadd_sat(RHS);
4776 case Builtin::BI__builtin_elementwise_sub_sat:
4779 return LHS.isSigned() ? LHS.ssub_sat(RHS) : LHS.usub_sat(RHS);
4781 case X86::BI__builtin_ia32_extract128i256:
4782 case X86::BI__builtin_ia32_vextractf128_pd256:
4783 case X86::BI__builtin_ia32_vextractf128_ps256:
4784 case X86::BI__builtin_ia32_vextractf128_si256:
4787 case X86::BI__builtin_ia32_extractf32x4_256_mask:
4788 case X86::BI__builtin_ia32_extractf32x4_mask:
4789 case X86::BI__builtin_ia32_extractf32x8_mask:
4790 case X86::BI__builtin_ia32_extractf64x2_256_mask:
4791 case X86::BI__builtin_ia32_extractf64x2_512_mask:
4792 case X86::BI__builtin_ia32_extractf64x4_mask:
4793 case X86::BI__builtin_ia32_extracti32x4_256_mask:
4794 case X86::BI__builtin_ia32_extracti32x4_mask:
4795 case X86::BI__builtin_ia32_extracti32x8_mask:
4796 case X86::BI__builtin_ia32_extracti64x2_256_mask:
4797 case X86::BI__builtin_ia32_extracti64x2_512_mask:
4798 case X86::BI__builtin_ia32_extracti64x4_mask:
4801 case clang::X86::BI__builtin_ia32_pmulhrsw128:
4802 case clang::X86::BI__builtin_ia32_pmulhrsw256:
4803 case clang::X86::BI__builtin_ia32_pmulhrsw512:
4806 return (llvm::APIntOps::mulsExtended(LHS, RHS).ashr(14) + 1)
4807 .extractBits(16, 1);
4810 case clang::X86::BI__builtin_ia32_movmskps:
4811 case clang::X86::BI__builtin_ia32_movmskpd:
4812 case clang::X86::BI__builtin_ia32_pmovmskb128:
4813 case clang::X86::BI__builtin_ia32_pmovmskb256:
4814 case clang::X86::BI__builtin_ia32_movmskps256:
4815 case clang::X86::BI__builtin_ia32_movmskpd256: {
4819 case X86::BI__builtin_ia32_psignb128:
4820 case X86::BI__builtin_ia32_psignb256:
4821 case X86::BI__builtin_ia32_psignw128:
4822 case X86::BI__builtin_ia32_psignw256:
4823 case X86::BI__builtin_ia32_psignd128:
4824 case X86::BI__builtin_ia32_psignd256:
4828 return APInt::getZero(AElem.getBitWidth());
4829 if (BElem.isNegative())
4834 case clang::X86::BI__builtin_ia32_pavgb128:
4835 case clang::X86::BI__builtin_ia32_pavgw128:
4836 case clang::X86::BI__builtin_ia32_pavgb256:
4837 case clang::X86::BI__builtin_ia32_pavgw256:
4838 case clang::X86::BI__builtin_ia32_pavgb512:
4839 case clang::X86::BI__builtin_ia32_pavgw512:
4841 llvm::APIntOps::avgCeilU);
4843 case clang::X86::BI__builtin_ia32_pmaddubsw128:
4844 case clang::X86::BI__builtin_ia32_pmaddubsw256:
4845 case clang::X86::BI__builtin_ia32_pmaddubsw512:
4850 unsigned BitWidth = 2 * LoLHS.getBitWidth();
4851 return (LoLHS.zext(BitWidth) * LoRHS.sext(BitWidth))
4852 .sadd_sat((HiLHS.zext(BitWidth) * HiRHS.sext(BitWidth)));
4855 case clang::X86::BI__builtin_ia32_pmaddwd128:
4856 case clang::X86::BI__builtin_ia32_pmaddwd256:
4857 case clang::X86::BI__builtin_ia32_pmaddwd512:
4862 unsigned BitWidth = 2 * LoLHS.getBitWidth();
4863 return (LoLHS.sext(BitWidth) * LoRHS.sext(BitWidth)) +
4864 (HiLHS.sext(BitWidth) * HiRHS.sext(BitWidth));
4867 case clang::X86::BI__builtin_ia32_pmulhuw128:
4868 case clang::X86::BI__builtin_ia32_pmulhuw256:
4869 case clang::X86::BI__builtin_ia32_pmulhuw512:
4871 llvm::APIntOps::mulhu);
4873 case clang::X86::BI__builtin_ia32_pmulhw128:
4874 case clang::X86::BI__builtin_ia32_pmulhw256:
4875 case clang::X86::BI__builtin_ia32_pmulhw512:
4877 llvm::APIntOps::mulhs);
4879 case clang::X86::BI__builtin_ia32_psllv2di:
4880 case clang::X86::BI__builtin_ia32_psllv4di:
4881 case clang::X86::BI__builtin_ia32_psllv4si:
4882 case clang::X86::BI__builtin_ia32_psllv8di:
4883 case clang::X86::BI__builtin_ia32_psllv8hi:
4884 case clang::X86::BI__builtin_ia32_psllv8si:
4885 case clang::X86::BI__builtin_ia32_psllv16hi:
4886 case clang::X86::BI__builtin_ia32_psllv16si:
4887 case clang::X86::BI__builtin_ia32_psllv32hi:
4888 case clang::X86::BI__builtin_ia32_psllwi128:
4889 case clang::X86::BI__builtin_ia32_psllwi256:
4890 case clang::X86::BI__builtin_ia32_psllwi512:
4891 case clang::X86::BI__builtin_ia32_pslldi128:
4892 case clang::X86::BI__builtin_ia32_pslldi256:
4893 case clang::X86::BI__builtin_ia32_pslldi512:
4894 case clang::X86::BI__builtin_ia32_psllqi128:
4895 case clang::X86::BI__builtin_ia32_psllqi256:
4896 case clang::X86::BI__builtin_ia32_psllqi512:
4899 if (RHS.uge(LHS.getBitWidth())) {
4900 return APInt::getZero(LHS.getBitWidth());
4902 return LHS.shl(RHS.getZExtValue());
4905 case clang::X86::BI__builtin_ia32_psrav4si:
4906 case clang::X86::BI__builtin_ia32_psrav8di:
4907 case clang::X86::BI__builtin_ia32_psrav8hi:
4908 case clang::X86::BI__builtin_ia32_psrav8si:
4909 case clang::X86::BI__builtin_ia32_psrav16hi:
4910 case clang::X86::BI__builtin_ia32_psrav16si:
4911 case clang::X86::BI__builtin_ia32_psrav32hi:
4912 case clang::X86::BI__builtin_ia32_psravq128:
4913 case clang::X86::BI__builtin_ia32_psravq256:
4914 case clang::X86::BI__builtin_ia32_psrawi128:
4915 case clang::X86::BI__builtin_ia32_psrawi256:
4916 case clang::X86::BI__builtin_ia32_psrawi512:
4917 case clang::X86::BI__builtin_ia32_psradi128:
4918 case clang::X86::BI__builtin_ia32_psradi256:
4919 case clang::X86::BI__builtin_ia32_psradi512:
4920 case clang::X86::BI__builtin_ia32_psraqi128:
4921 case clang::X86::BI__builtin_ia32_psraqi256:
4922 case clang::X86::BI__builtin_ia32_psraqi512:
4925 if (RHS.uge(LHS.getBitWidth())) {
4926 return LHS.ashr(LHS.getBitWidth() - 1);
4928 return LHS.ashr(RHS.getZExtValue());
4931 case clang::X86::BI__builtin_ia32_psrlv2di:
4932 case clang::X86::BI__builtin_ia32_psrlv4di:
4933 case clang::X86::BI__builtin_ia32_psrlv4si:
4934 case clang::X86::BI__builtin_ia32_psrlv8di:
4935 case clang::X86::BI__builtin_ia32_psrlv8hi:
4936 case clang::X86::BI__builtin_ia32_psrlv8si:
4937 case clang::X86::BI__builtin_ia32_psrlv16hi:
4938 case clang::X86::BI__builtin_ia32_psrlv16si:
4939 case clang::X86::BI__builtin_ia32_psrlv32hi:
4940 case clang::X86::BI__builtin_ia32_psrlwi128:
4941 case clang::X86::BI__builtin_ia32_psrlwi256:
4942 case clang::X86::BI__builtin_ia32_psrlwi512:
4943 case clang::X86::BI__builtin_ia32_psrldi128:
4944 case clang::X86::BI__builtin_ia32_psrldi256:
4945 case clang::X86::BI__builtin_ia32_psrldi512:
4946 case clang::X86::BI__builtin_ia32_psrlqi128:
4947 case clang::X86::BI__builtin_ia32_psrlqi256:
4948 case clang::X86::BI__builtin_ia32_psrlqi512:
4951 if (RHS.uge(LHS.getBitWidth())) {
4952 return APInt::getZero(LHS.getBitWidth());
4954 return LHS.lshr(RHS.getZExtValue());
4956 case clang::X86::BI__builtin_ia32_packsswb128:
4957 case clang::X86::BI__builtin_ia32_packsswb256:
4958 case clang::X86::BI__builtin_ia32_packsswb512:
4959 case clang::X86::BI__builtin_ia32_packssdw128:
4960 case clang::X86::BI__builtin_ia32_packssdw256:
4961 case clang::X86::BI__builtin_ia32_packssdw512:
4963 return APInt(Src).truncSSat(Src.getBitWidth() / 2);
4965 case clang::X86::BI__builtin_ia32_packusdw128:
4966 case clang::X86::BI__builtin_ia32_packusdw256:
4967 case clang::X86::BI__builtin_ia32_packusdw512:
4968 case clang::X86::BI__builtin_ia32_packuswb128:
4969 case clang::X86::BI__builtin_ia32_packuswb256:
4970 case clang::X86::BI__builtin_ia32_packuswb512:
4972 return APInt(Src).truncSSatU(Src.getBitWidth() / 2);
4975 case clang::X86::BI__builtin_ia32_selectss_128:
4976 case clang::X86::BI__builtin_ia32_selectsd_128:
4977 case clang::X86::BI__builtin_ia32_selectsh_128:
4978 case clang::X86::BI__builtin_ia32_selectsbf_128:
4980 case clang::X86::BI__builtin_ia32_vprotbi:
4981 case clang::X86::BI__builtin_ia32_vprotdi:
4982 case clang::X86::BI__builtin_ia32_vprotqi:
4983 case clang::X86::BI__builtin_ia32_vprotwi:
4984 case clang::X86::BI__builtin_ia32_prold128:
4985 case clang::X86::BI__builtin_ia32_prold256:
4986 case clang::X86::BI__builtin_ia32_prold512:
4987 case clang::X86::BI__builtin_ia32_prolq128:
4988 case clang::X86::BI__builtin_ia32_prolq256:
4989 case clang::X86::BI__builtin_ia32_prolq512:
4992 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS.rotl(RHS); });
4994 case clang::X86::BI__builtin_ia32_prord128:
4995 case clang::X86::BI__builtin_ia32_prord256:
4996 case clang::X86::BI__builtin_ia32_prord512:
4997 case clang::X86::BI__builtin_ia32_prorq128:
4998 case clang::X86::BI__builtin_ia32_prorq256:
4999 case clang::X86::BI__builtin_ia32_prorq512:
5002 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS.rotr(RHS); });
5004 case Builtin::BI__builtin_elementwise_max:
5005 case Builtin::BI__builtin_elementwise_min:
5008 case clang::X86::BI__builtin_ia32_phaddw128:
5009 case clang::X86::BI__builtin_ia32_phaddw256:
5010 case clang::X86::BI__builtin_ia32_phaddd128:
5011 case clang::X86::BI__builtin_ia32_phaddd256:
5014 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS + RHS; });
5015 case clang::X86::BI__builtin_ia32_phaddsw128:
5016 case clang::X86::BI__builtin_ia32_phaddsw256:
5019 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS.sadd_sat(RHS); });
5020 case clang::X86::BI__builtin_ia32_phsubw128:
5021 case clang::X86::BI__builtin_ia32_phsubw256:
5022 case clang::X86::BI__builtin_ia32_phsubd128:
5023 case clang::X86::BI__builtin_ia32_phsubd256:
5026 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS - RHS; });
5027 case clang::X86::BI__builtin_ia32_phsubsw128:
5028 case clang::X86::BI__builtin_ia32_phsubsw256:
5031 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS.ssub_sat(RHS); });
5032 case clang::X86::BI__builtin_ia32_haddpd:
5033 case clang::X86::BI__builtin_ia32_haddps:
5034 case clang::X86::BI__builtin_ia32_haddpd256:
5035 case clang::X86::BI__builtin_ia32_haddps256:
5038 [](
const APFloat &LHS,
const APFloat &RHS, llvm::RoundingMode RM) {
5043 case clang::X86::BI__builtin_ia32_hsubpd:
5044 case clang::X86::BI__builtin_ia32_hsubps:
5045 case clang::X86::BI__builtin_ia32_hsubpd256:
5046 case clang::X86::BI__builtin_ia32_hsubps256:
5049 [](
const APFloat &LHS,
const APFloat &RHS, llvm::RoundingMode RM) {
5051 F.subtract(RHS, RM);
5054 case clang::X86::BI__builtin_ia32_addsubpd:
5055 case clang::X86::BI__builtin_ia32_addsubps:
5056 case clang::X86::BI__builtin_ia32_addsubpd256:
5057 case clang::X86::BI__builtin_ia32_addsubps256:
5060 case clang::X86::BI__builtin_ia32_pmuldq128:
5061 case clang::X86::BI__builtin_ia32_pmuldq256:
5062 case clang::X86::BI__builtin_ia32_pmuldq512:
5067 return llvm::APIntOps::mulsExtended(LoLHS, LoRHS);
5070 case clang::X86::BI__builtin_ia32_pmuludq128:
5071 case clang::X86::BI__builtin_ia32_pmuludq256:
5072 case clang::X86::BI__builtin_ia32_pmuludq512:
5077 return llvm::APIntOps::muluExtended(LoLHS, LoRHS);
5080 case clang::X86::BI__builtin_ia32_pclmulqdq128:
5081 case clang::X86::BI__builtin_ia32_pclmulqdq256:
5082 case clang::X86::BI__builtin_ia32_pclmulqdq512:
5085 case Builtin::BI__builtin_elementwise_fma:
5089 llvm::RoundingMode RM) {
5091 F.fusedMultiplyAdd(Y, Z, RM);
5095 case X86::BI__builtin_ia32_vpmadd52luq128:
5096 case X86::BI__builtin_ia32_vpmadd52luq256:
5097 case X86::BI__builtin_ia32_vpmadd52luq512:
5100 return A + (B.trunc(52) *
C.trunc(52)).zext(64);
5102 case X86::BI__builtin_ia32_vpmadd52huq128:
5103 case X86::BI__builtin_ia32_vpmadd52huq256:
5104 case X86::BI__builtin_ia32_vpmadd52huq512:
5107 return A + llvm::APIntOps::mulhu(B.trunc(52),
C.trunc(52)).zext(64);
5110 case X86::BI__builtin_ia32_vpshldd128:
5111 case X86::BI__builtin_ia32_vpshldd256:
5112 case X86::BI__builtin_ia32_vpshldd512:
5113 case X86::BI__builtin_ia32_vpshldq128:
5114 case X86::BI__builtin_ia32_vpshldq256:
5115 case X86::BI__builtin_ia32_vpshldq512:
5116 case X86::BI__builtin_ia32_vpshldw128:
5117 case X86::BI__builtin_ia32_vpshldw256:
5118 case X86::BI__builtin_ia32_vpshldw512:
5122 return llvm::APIntOps::fshl(Hi, Lo, Amt);
5125 case X86::BI__builtin_ia32_vpshrdd128:
5126 case X86::BI__builtin_ia32_vpshrdd256:
5127 case X86::BI__builtin_ia32_vpshrdd512:
5128 case X86::BI__builtin_ia32_vpshrdq128:
5129 case X86::BI__builtin_ia32_vpshrdq256:
5130 case X86::BI__builtin_ia32_vpshrdq512:
5131 case X86::BI__builtin_ia32_vpshrdw128:
5132 case X86::BI__builtin_ia32_vpshrdw256:
5133 case X86::BI__builtin_ia32_vpshrdw512:
5138 return llvm::APIntOps::fshr(Hi, Lo, Amt);
5140 case X86::BI__builtin_ia32_vpconflictsi_128:
5141 case X86::BI__builtin_ia32_vpconflictsi_256:
5142 case X86::BI__builtin_ia32_vpconflictsi_512:
5143 case X86::BI__builtin_ia32_vpconflictdi_128:
5144 case X86::BI__builtin_ia32_vpconflictdi_256:
5145 case X86::BI__builtin_ia32_vpconflictdi_512:
5147 case X86::BI__builtin_ia32_compressdf128_mask:
5148 case X86::BI__builtin_ia32_compressdf256_mask:
5149 case X86::BI__builtin_ia32_compressdf512_mask:
5150 case X86::BI__builtin_ia32_compressdi128_mask:
5151 case X86::BI__builtin_ia32_compressdi256_mask:
5152 case X86::BI__builtin_ia32_compressdi512_mask:
5153 case X86::BI__builtin_ia32_compresshi128_mask:
5154 case X86::BI__builtin_ia32_compresshi256_mask:
5155 case X86::BI__builtin_ia32_compresshi512_mask:
5156 case X86::BI__builtin_ia32_compressqi128_mask:
5157 case X86::BI__builtin_ia32_compressqi256_mask:
5158 case X86::BI__builtin_ia32_compressqi512_mask:
5159 case X86::BI__builtin_ia32_compresssf128_mask:
5160 case X86::BI__builtin_ia32_compresssf256_mask:
5161 case X86::BI__builtin_ia32_compresssf512_mask:
5162 case X86::BI__builtin_ia32_compresssi128_mask:
5163 case X86::BI__builtin_ia32_compresssi256_mask:
5164 case X86::BI__builtin_ia32_compresssi512_mask: {
5166 Call->getArg(0)->getType()->castAs<
VectorType>()->getNumElements();
5168 S, OpPC,
Call, [NumElems](
unsigned DstIdx,
const APInt &ShuffleMask) {
5169 APInt CompressMask = ShuffleMask.trunc(NumElems);
5170 if (DstIdx < CompressMask.popcount()) {
5171 while (DstIdx != 0) {
5172 CompressMask = CompressMask & (CompressMask - 1);
5175 return std::pair<unsigned, int>{
5176 0,
static_cast<int>(CompressMask.countr_zero())};
5178 return std::pair<unsigned, int>{1,
static_cast<int>(DstIdx)};
5181 case X86::BI__builtin_ia32_expanddf128_mask:
5182 case X86::BI__builtin_ia32_expanddf256_mask:
5183 case X86::BI__builtin_ia32_expanddf512_mask:
5184 case X86::BI__builtin_ia32_expanddi128_mask:
5185 case X86::BI__builtin_ia32_expanddi256_mask:
5186 case X86::BI__builtin_ia32_expanddi512_mask:
5187 case X86::BI__builtin_ia32_expandhi128_mask:
5188 case X86::BI__builtin_ia32_expandhi256_mask:
5189 case X86::BI__builtin_ia32_expandhi512_mask:
5190 case X86::BI__builtin_ia32_expandqi128_mask:
5191 case X86::BI__builtin_ia32_expandqi256_mask:
5192 case X86::BI__builtin_ia32_expandqi512_mask:
5193 case X86::BI__builtin_ia32_expandsf128_mask:
5194 case X86::BI__builtin_ia32_expandsf256_mask:
5195 case X86::BI__builtin_ia32_expandsf512_mask:
5196 case X86::BI__builtin_ia32_expandsi128_mask:
5197 case X86::BI__builtin_ia32_expandsi256_mask:
5198 case X86::BI__builtin_ia32_expandsi512_mask: {
5200 S, OpPC,
Call, [](
unsigned DstIdx,
const APInt &ShuffleMask) {
5203 APInt ExpandMask = ShuffleMask.trunc(DstIdx + 1);
5204 if (ExpandMask[DstIdx]) {
5205 int SrcIdx = ExpandMask.popcount() - 1;
5206 return std::pair<unsigned, int>{0, SrcIdx};
5208 return std::pair<unsigned, int>{1,
static_cast<int>(DstIdx)};
5211 case clang::X86::BI__builtin_ia32_blendpd:
5212 case clang::X86::BI__builtin_ia32_blendpd256:
5213 case clang::X86::BI__builtin_ia32_blendps:
5214 case clang::X86::BI__builtin_ia32_blendps256:
5215 case clang::X86::BI__builtin_ia32_pblendw128:
5216 case clang::X86::BI__builtin_ia32_pblendw256:
5217 case clang::X86::BI__builtin_ia32_pblendd128:
5218 case clang::X86::BI__builtin_ia32_pblendd256:
5220 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5222 unsigned MaskBit = (ShuffleMask >> (DstIdx % 8)) & 0x1;
5223 unsigned SrcVecIdx = MaskBit ? 1 : 0;
5224 return std::pair<unsigned, int>{SrcVecIdx,
static_cast<int>(DstIdx)};
5229 case clang::X86::BI__builtin_ia32_blendvpd:
5230 case clang::X86::BI__builtin_ia32_blendvpd256:
5231 case clang::X86::BI__builtin_ia32_blendvps:
5232 case clang::X86::BI__builtin_ia32_blendvps256:
5236 llvm::RoundingMode) {
return C.isNegative() ? T : F; });
5238 case clang::X86::BI__builtin_ia32_pblendvb128:
5239 case clang::X86::BI__builtin_ia32_pblendvb256:
5242 return ((
APInt)
C).isNegative() ? T : F;
5244 case X86::BI__builtin_ia32_ptestz128:
5245 case X86::BI__builtin_ia32_ptestz256:
5246 case X86::BI__builtin_ia32_vtestzps:
5247 case X86::BI__builtin_ia32_vtestzps256:
5248 case X86::BI__builtin_ia32_vtestzpd:
5249 case X86::BI__builtin_ia32_vtestzpd256:
5252 [](
const APInt &A,
const APInt &B) {
return (A & B) == 0; });
5253 case X86::BI__builtin_ia32_ptestc128:
5254 case X86::BI__builtin_ia32_ptestc256:
5255 case X86::BI__builtin_ia32_vtestcps:
5256 case X86::BI__builtin_ia32_vtestcps256:
5257 case X86::BI__builtin_ia32_vtestcpd:
5258 case X86::BI__builtin_ia32_vtestcpd256:
5261 [](
const APInt &A,
const APInt &B) {
return (~A & B) == 0; });
5262 case X86::BI__builtin_ia32_ptestnzc128:
5263 case X86::BI__builtin_ia32_ptestnzc256:
5264 case X86::BI__builtin_ia32_vtestnzcps:
5265 case X86::BI__builtin_ia32_vtestnzcps256:
5266 case X86::BI__builtin_ia32_vtestnzcpd:
5267 case X86::BI__builtin_ia32_vtestnzcpd256:
5270 return ((A & B) != 0) && ((~A & B) != 0);
5272 case X86::BI__builtin_ia32_selectb_128:
5273 case X86::BI__builtin_ia32_selectb_256:
5274 case X86::BI__builtin_ia32_selectb_512:
5275 case X86::BI__builtin_ia32_selectw_128:
5276 case X86::BI__builtin_ia32_selectw_256:
5277 case X86::BI__builtin_ia32_selectw_512:
5278 case X86::BI__builtin_ia32_selectd_128:
5279 case X86::BI__builtin_ia32_selectd_256:
5280 case X86::BI__builtin_ia32_selectd_512:
5281 case X86::BI__builtin_ia32_selectq_128:
5282 case X86::BI__builtin_ia32_selectq_256:
5283 case X86::BI__builtin_ia32_selectq_512:
5284 case X86::BI__builtin_ia32_selectph_128:
5285 case X86::BI__builtin_ia32_selectph_256:
5286 case X86::BI__builtin_ia32_selectph_512:
5287 case X86::BI__builtin_ia32_selectpbf_128:
5288 case X86::BI__builtin_ia32_selectpbf_256:
5289 case X86::BI__builtin_ia32_selectpbf_512:
5290 case X86::BI__builtin_ia32_selectps_128:
5291 case X86::BI__builtin_ia32_selectps_256:
5292 case X86::BI__builtin_ia32_selectps_512:
5293 case X86::BI__builtin_ia32_selectpd_128:
5294 case X86::BI__builtin_ia32_selectpd_256:
5295 case X86::BI__builtin_ia32_selectpd_512:
5298 case X86::BI__builtin_ia32_shufps:
5299 case X86::BI__builtin_ia32_shufps256:
5300 case X86::BI__builtin_ia32_shufps512:
5302 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5303 unsigned NumElemPerLane = 4;
5304 unsigned NumSelectableElems = NumElemPerLane / 2;
5305 unsigned BitsPerElem = 2;
5306 unsigned IndexMask = 0x3;
5307 unsigned MaskBits = 8;
5308 unsigned Lane = DstIdx / NumElemPerLane;
5309 unsigned ElemInLane = DstIdx % NumElemPerLane;
5310 unsigned LaneOffset = Lane * NumElemPerLane;
5311 unsigned SrcIdx = ElemInLane >= NumSelectableElems ? 1 : 0;
5312 unsigned BitIndex = (DstIdx * BitsPerElem) % MaskBits;
5313 unsigned Index = (ShuffleMask >> BitIndex) & IndexMask;
5314 return std::pair<unsigned, int>{SrcIdx,
5315 static_cast<int>(LaneOffset + Index)};
5317 case X86::BI__builtin_ia32_shufpd:
5318 case X86::BI__builtin_ia32_shufpd256:
5319 case X86::BI__builtin_ia32_shufpd512:
5321 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5322 unsigned NumElemPerLane = 2;
5323 unsigned NumSelectableElems = NumElemPerLane / 2;
5324 unsigned BitsPerElem = 1;
5325 unsigned IndexMask = 0x1;
5326 unsigned MaskBits = 8;
5327 unsigned Lane = DstIdx / NumElemPerLane;
5328 unsigned ElemInLane = DstIdx % NumElemPerLane;
5329 unsigned LaneOffset = Lane * NumElemPerLane;
5330 unsigned SrcIdx = ElemInLane >= NumSelectableElems ? 1 : 0;
5331 unsigned BitIndex = (DstIdx * BitsPerElem) % MaskBits;
5332 unsigned Index = (ShuffleMask >> BitIndex) & IndexMask;
5333 return std::pair<unsigned, int>{SrcIdx,
5334 static_cast<int>(LaneOffset + Index)};
5337 case X86::BI__builtin_ia32_vgf2p8affineinvqb_v16qi:
5338 case X86::BI__builtin_ia32_vgf2p8affineinvqb_v32qi:
5339 case X86::BI__builtin_ia32_vgf2p8affineinvqb_v64qi:
5341 case X86::BI__builtin_ia32_vgf2p8affineqb_v16qi:
5342 case X86::BI__builtin_ia32_vgf2p8affineqb_v32qi:
5343 case X86::BI__builtin_ia32_vgf2p8affineqb_v64qi:
5346 case X86::BI__builtin_ia32_vgf2p8mulb_v16qi:
5347 case X86::BI__builtin_ia32_vgf2p8mulb_v32qi:
5348 case X86::BI__builtin_ia32_vgf2p8mulb_v64qi:
5351 case X86::BI__builtin_ia32_insertps128:
5353 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned Mask) {
5355 if ((Mask & (1 << DstIdx)) != 0) {
5356 return std::pair<unsigned, int>{0, -1};
5360 unsigned SrcElem = (Mask >> 6) & 0x3;
5361 unsigned DstElem = (Mask >> 4) & 0x3;
5362 if (DstIdx == DstElem) {
5364 return std::pair<unsigned, int>{1,
static_cast<int>(SrcElem)};
5367 return std::pair<unsigned, int>{0,
static_cast<int>(DstIdx)};
5370 case X86::BI__builtin_ia32_permvarsi256:
5371 case X86::BI__builtin_ia32_permvarsf256:
5372 case X86::BI__builtin_ia32_permvardf512:
5373 case X86::BI__builtin_ia32_permvardi512:
5374 case X86::BI__builtin_ia32_permvarhi128:
5376 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5377 int Offset = ShuffleMask & 0x7;
5378 return std::pair<unsigned, int>{0, Offset};
5380 case X86::BI__builtin_ia32_permvarqi128:
5381 case X86::BI__builtin_ia32_permvarhi256:
5382 case X86::BI__builtin_ia32_permvarsi512:
5383 case X86::BI__builtin_ia32_permvarsf512:
5385 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5386 int Offset = ShuffleMask & 0xF;
5387 return std::pair<unsigned, int>{0, Offset};
5389 case X86::BI__builtin_ia32_permvardi256:
5390 case X86::BI__builtin_ia32_permvardf256:
5392 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5393 int Offset = ShuffleMask & 0x3;
5394 return std::pair<unsigned, int>{0, Offset};
5396 case X86::BI__builtin_ia32_permvarqi256:
5397 case X86::BI__builtin_ia32_permvarhi512:
5399 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5400 int Offset = ShuffleMask & 0x1F;
5401 return std::pair<unsigned, int>{0, Offset};
5403 case X86::BI__builtin_ia32_permvarqi512:
5405 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5406 int Offset = ShuffleMask & 0x3F;
5407 return std::pair<unsigned, int>{0, Offset};
5409 case X86::BI__builtin_ia32_vpermi2varq128:
5410 case X86::BI__builtin_ia32_vpermi2varpd128:
5412 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5413 int Offset = ShuffleMask & 0x1;
5414 unsigned SrcIdx = (ShuffleMask >> 1) & 0x1;
5415 return std::pair<unsigned, int>{SrcIdx, Offset};
5417 case X86::BI__builtin_ia32_vpermi2vard128:
5418 case X86::BI__builtin_ia32_vpermi2varps128:
5419 case X86::BI__builtin_ia32_vpermi2varq256:
5420 case X86::BI__builtin_ia32_vpermi2varpd256:
5422 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5423 int Offset = ShuffleMask & 0x3;
5424 unsigned SrcIdx = (ShuffleMask >> 2) & 0x1;
5425 return std::pair<unsigned, int>{SrcIdx, Offset};
5427 case X86::BI__builtin_ia32_vpermi2varhi128:
5428 case X86::BI__builtin_ia32_vpermi2vard256:
5429 case X86::BI__builtin_ia32_vpermi2varps256:
5430 case X86::BI__builtin_ia32_vpermi2varq512:
5431 case X86::BI__builtin_ia32_vpermi2varpd512:
5433 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5434 int Offset = ShuffleMask & 0x7;
5435 unsigned SrcIdx = (ShuffleMask >> 3) & 0x1;
5436 return std::pair<unsigned, int>{SrcIdx, Offset};
5438 case X86::BI__builtin_ia32_vpermi2varqi128:
5439 case X86::BI__builtin_ia32_vpermi2varhi256:
5440 case X86::BI__builtin_ia32_vpermi2vard512:
5441 case X86::BI__builtin_ia32_vpermi2varps512:
5443 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5444 int Offset = ShuffleMask & 0xF;
5445 unsigned SrcIdx = (ShuffleMask >> 4) & 0x1;
5446 return std::pair<unsigned, int>{SrcIdx, Offset};
5448 case X86::BI__builtin_ia32_vpermi2varqi256:
5449 case X86::BI__builtin_ia32_vpermi2varhi512:
5451 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5452 int Offset = ShuffleMask & 0x1F;
5453 unsigned SrcIdx = (ShuffleMask >> 5) & 0x1;
5454 return std::pair<unsigned, int>{SrcIdx, Offset};
5456 case X86::BI__builtin_ia32_vpermi2varqi512:
5458 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5459 int Offset = ShuffleMask & 0x3F;
5460 unsigned SrcIdx = (ShuffleMask >> 6) & 0x1;
5461 return std::pair<unsigned, int>{SrcIdx, Offset};
5463 case X86::BI__builtin_ia32_vperm2f128_pd256:
5464 case X86::BI__builtin_ia32_vperm2f128_ps256:
5465 case X86::BI__builtin_ia32_vperm2f128_si256:
5466 case X86::BI__builtin_ia32_permti256: {
5467 unsigned NumElements =
5468 Call->getArg(0)->getType()->castAs<
VectorType>()->getNumElements();
5469 unsigned PreservedBitsCnt = NumElements >> 2;
5472 [PreservedBitsCnt](
unsigned DstIdx,
unsigned ShuffleMask) {
5473 unsigned ControlBitsCnt = DstIdx >> PreservedBitsCnt << 2;
5474 unsigned ControlBits = ShuffleMask >> ControlBitsCnt;
5476 if (ControlBits & 0b1000)
5477 return std::make_pair(0u, -1);
5479 unsigned SrcVecIdx = (ControlBits & 0b10) >> 1;
5480 unsigned PreservedBitsMask = (1 << PreservedBitsCnt) - 1;
5481 int SrcIdx = ((ControlBits & 0b1) << PreservedBitsCnt) |
5482 (DstIdx & PreservedBitsMask);
5483 return std::make_pair(SrcVecIdx, SrcIdx);
5486 case X86::BI__builtin_ia32_pshufb128:
5487 case X86::BI__builtin_ia32_pshufb256:
5488 case X86::BI__builtin_ia32_pshufb512:
5490 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5491 uint8_t Ctlb =
static_cast<uint8_t
>(ShuffleMask);
5493 return std::make_pair(0, -1);
5495 unsigned LaneBase = (DstIdx / 16) * 16;
5496 unsigned SrcOffset = Ctlb & 0x0F;
5497 unsigned SrcIdx = LaneBase + SrcOffset;
5498 return std::make_pair(0,
static_cast<int>(SrcIdx));
5501 case X86::BI__builtin_ia32_pshuflw:
5502 case X86::BI__builtin_ia32_pshuflw256:
5503 case X86::BI__builtin_ia32_pshuflw512:
5505 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5506 unsigned LaneBase = (DstIdx / 8) * 8;
5507 unsigned LaneIdx = DstIdx % 8;
5509 unsigned Sel = (ShuffleMask >> (2 * LaneIdx)) & 0x3;
5510 return std::make_pair(0,
static_cast<int>(LaneBase + Sel));
5513 return std::make_pair(0,
static_cast<int>(DstIdx));
5516 case X86::BI__builtin_ia32_pshufhw:
5517 case X86::BI__builtin_ia32_pshufhw256:
5518 case X86::BI__builtin_ia32_pshufhw512:
5520 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5521 unsigned LaneBase = (DstIdx / 8) * 8;
5522 unsigned LaneIdx = DstIdx % 8;
5524 unsigned Sel = (ShuffleMask >> (2 * (LaneIdx - 4))) & 0x3;
5525 return std::make_pair(0,
static_cast<int>(LaneBase + 4 + Sel));
5528 return std::make_pair(0,
static_cast<int>(DstIdx));
5531 case X86::BI__builtin_ia32_pshufd:
5532 case X86::BI__builtin_ia32_pshufd256:
5533 case X86::BI__builtin_ia32_pshufd512:
5534 case X86::BI__builtin_ia32_vpermilps:
5535 case X86::BI__builtin_ia32_vpermilps256:
5536 case X86::BI__builtin_ia32_vpermilps512:
5538 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5539 unsigned LaneBase = (DstIdx / 4) * 4;
5540 unsigned LaneIdx = DstIdx % 4;
5541 unsigned Sel = (ShuffleMask >> (2 * LaneIdx)) & 0x3;
5542 return std::make_pair(0,
static_cast<int>(LaneBase + Sel));
5545 case X86::BI__builtin_ia32_vpermilvarpd:
5546 case X86::BI__builtin_ia32_vpermilvarpd256:
5547 case X86::BI__builtin_ia32_vpermilvarpd512:
5549 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5550 unsigned NumElemPerLane = 2;
5551 unsigned Lane = DstIdx / NumElemPerLane;
5552 unsigned Offset = ShuffleMask & 0b10 ? 1 : 0;
5553 return std::make_pair(
5554 0,
static_cast<int>(Lane * NumElemPerLane + Offset));
5557 case X86::BI__builtin_ia32_vpermilvarps:
5558 case X86::BI__builtin_ia32_vpermilvarps256:
5559 case X86::BI__builtin_ia32_vpermilvarps512:
5561 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned ShuffleMask) {
5562 unsigned NumElemPerLane = 4;
5563 unsigned Lane = DstIdx / NumElemPerLane;
5564 unsigned Offset = ShuffleMask & 0b11;
5565 return std::make_pair(
5566 0,
static_cast<int>(Lane * NumElemPerLane + Offset));
5569 case X86::BI__builtin_ia32_vpermilpd:
5570 case X86::BI__builtin_ia32_vpermilpd256:
5571 case X86::BI__builtin_ia32_vpermilpd512:
5573 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned Control) {
5574 unsigned NumElemPerLane = 2;
5575 unsigned BitsPerElem = 1;
5576 unsigned MaskBits = 8;
5577 unsigned IndexMask = 0x1;
5578 unsigned Lane = DstIdx / NumElemPerLane;
5579 unsigned LaneOffset = Lane * NumElemPerLane;
5580 unsigned BitIndex = (DstIdx * BitsPerElem) % MaskBits;
5581 unsigned Index = (Control >> BitIndex) & IndexMask;
5582 return std::make_pair(0,
static_cast<int>(LaneOffset + Index));
5585 case X86::BI__builtin_ia32_permdf256:
5586 case X86::BI__builtin_ia32_permdi256:
5588 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned Control) {
5591 unsigned Index = (Control >> (2 * DstIdx)) & 0x3;
5592 return std::make_pair(0,
static_cast<int>(Index));
5595 case X86::BI__builtin_ia32_vpmultishiftqb128:
5596 case X86::BI__builtin_ia32_vpmultishiftqb256:
5597 case X86::BI__builtin_ia32_vpmultishiftqb512:
5599 case X86::BI__builtin_ia32_kandqi:
5600 case X86::BI__builtin_ia32_kandhi:
5601 case X86::BI__builtin_ia32_kandsi:
5602 case X86::BI__builtin_ia32_kanddi:
5605 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS & RHS; });
5607 case X86::BI__builtin_ia32_kandnqi:
5608 case X86::BI__builtin_ia32_kandnhi:
5609 case X86::BI__builtin_ia32_kandnsi:
5610 case X86::BI__builtin_ia32_kandndi:
5613 [](
const APSInt &LHS,
const APSInt &RHS) {
return ~LHS & RHS; });
5615 case X86::BI__builtin_ia32_korqi:
5616 case X86::BI__builtin_ia32_korhi:
5617 case X86::BI__builtin_ia32_korsi:
5618 case X86::BI__builtin_ia32_kordi:
5621 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS | RHS; });
5623 case X86::BI__builtin_ia32_kxnorqi:
5624 case X86::BI__builtin_ia32_kxnorhi:
5625 case X86::BI__builtin_ia32_kxnorsi:
5626 case X86::BI__builtin_ia32_kxnordi:
5629 [](
const APSInt &LHS,
const APSInt &RHS) {
return ~(LHS ^ RHS); });
5631 case X86::BI__builtin_ia32_kxorqi:
5632 case X86::BI__builtin_ia32_kxorhi:
5633 case X86::BI__builtin_ia32_kxorsi:
5634 case X86::BI__builtin_ia32_kxordi:
5637 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS ^ RHS; });
5639 case X86::BI__builtin_ia32_knotqi:
5640 case X86::BI__builtin_ia32_knothi:
5641 case X86::BI__builtin_ia32_knotsi:
5642 case X86::BI__builtin_ia32_knotdi:
5644 S, OpPC,
Call, [](
const APSInt &Src) {
return ~Src; });
5646 case X86::BI__builtin_ia32_kaddqi:
5647 case X86::BI__builtin_ia32_kaddhi:
5648 case X86::BI__builtin_ia32_kaddsi:
5649 case X86::BI__builtin_ia32_kadddi:
5652 [](
const APSInt &LHS,
const APSInt &RHS) {
return LHS + RHS; });
5654 case X86::BI__builtin_ia32_kmovb:
5655 case X86::BI__builtin_ia32_kmovw:
5656 case X86::BI__builtin_ia32_kmovd:
5657 case X86::BI__builtin_ia32_kmovq:
5659 S, OpPC,
Call, [](
const APSInt &Src) {
return Src; });
5661 case X86::BI__builtin_ia32_kunpckhi:
5662 case X86::BI__builtin_ia32_kunpckdi:
5663 case X86::BI__builtin_ia32_kunpcksi:
5668 unsigned BW = A.getBitWidth();
5669 return APSInt(A.trunc(BW / 2).concat(B.trunc(BW / 2)),
5673 case X86::BI__builtin_ia32_phminposuw128:
5676 case X86::BI__builtin_ia32_psraq128:
5677 case X86::BI__builtin_ia32_psraq256:
5678 case X86::BI__builtin_ia32_psraq512:
5679 case X86::BI__builtin_ia32_psrad128:
5680 case X86::BI__builtin_ia32_psrad256:
5681 case X86::BI__builtin_ia32_psrad512:
5682 case X86::BI__builtin_ia32_psraw128:
5683 case X86::BI__builtin_ia32_psraw256:
5684 case X86::BI__builtin_ia32_psraw512:
5687 [](
const APInt &Elt, uint64_t Count) {
return Elt.ashr(Count); },
5688 [](
const APInt &Elt,
unsigned Width) {
return Elt.ashr(Width - 1); });
5690 case X86::BI__builtin_ia32_psllq128:
5691 case X86::BI__builtin_ia32_psllq256:
5692 case X86::BI__builtin_ia32_psllq512:
5693 case X86::BI__builtin_ia32_pslld128:
5694 case X86::BI__builtin_ia32_pslld256:
5695 case X86::BI__builtin_ia32_pslld512:
5696 case X86::BI__builtin_ia32_psllw128:
5697 case X86::BI__builtin_ia32_psllw256:
5698 case X86::BI__builtin_ia32_psllw512:
5701 [](
const APInt &Elt, uint64_t Count) {
return Elt.shl(Count); },
5702 [](
const APInt &Elt,
unsigned Width) {
return APInt::getZero(Width); });
5704 case X86::BI__builtin_ia32_psrlq128:
5705 case X86::BI__builtin_ia32_psrlq256:
5706 case X86::BI__builtin_ia32_psrlq512:
5707 case X86::BI__builtin_ia32_psrld128:
5708 case X86::BI__builtin_ia32_psrld256:
5709 case X86::BI__builtin_ia32_psrld512:
5710 case X86::BI__builtin_ia32_psrlw128:
5711 case X86::BI__builtin_ia32_psrlw256:
5712 case X86::BI__builtin_ia32_psrlw512:
5715 [](
const APInt &Elt, uint64_t Count) {
return Elt.lshr(Count); },
5716 [](
const APInt &Elt,
unsigned Width) {
return APInt::getZero(Width); });
5718 case X86::BI__builtin_ia32_pternlogd128_mask:
5719 case X86::BI__builtin_ia32_pternlogd256_mask:
5720 case X86::BI__builtin_ia32_pternlogd512_mask:
5721 case X86::BI__builtin_ia32_pternlogq128_mask:
5722 case X86::BI__builtin_ia32_pternlogq256_mask:
5723 case X86::BI__builtin_ia32_pternlogq512_mask:
5725 case X86::BI__builtin_ia32_pternlogd128_maskz:
5726 case X86::BI__builtin_ia32_pternlogd256_maskz:
5727 case X86::BI__builtin_ia32_pternlogd512_maskz:
5728 case X86::BI__builtin_ia32_pternlogq128_maskz:
5729 case X86::BI__builtin_ia32_pternlogq256_maskz:
5730 case X86::BI__builtin_ia32_pternlogq512_maskz:
5732 case Builtin::BI__builtin_elementwise_fshl:
5734 llvm::APIntOps::fshl);
5735 case Builtin::BI__builtin_elementwise_fshr:
5737 llvm::APIntOps::fshr);
5739 case X86::BI__builtin_ia32_shuf_f32x4_256:
5740 case X86::BI__builtin_ia32_shuf_i32x4_256:
5741 case X86::BI__builtin_ia32_shuf_f64x2_256:
5742 case X86::BI__builtin_ia32_shuf_i64x2_256:
5743 case X86::BI__builtin_ia32_shuf_f32x4:
5744 case X86::BI__builtin_ia32_shuf_i32x4:
5745 case X86::BI__builtin_ia32_shuf_f64x2:
5746 case X86::BI__builtin_ia32_shuf_i64x2: {
5752 unsigned LaneBits = 128u;
5753 unsigned NumLanes = (NumElems * ElemBits) / LaneBits;
5754 unsigned NumElemsPerLane = LaneBits / ElemBits;
5758 [NumLanes, NumElemsPerLane](
unsigned DstIdx,
unsigned ShuffleMask) {
5760 unsigned BitsPerElem = NumLanes / 2;
5761 unsigned IndexMask = (1u << BitsPerElem) - 1;
5762 unsigned Lane = DstIdx / NumElemsPerLane;
5763 unsigned SrcIdx = (Lane < NumLanes / 2) ? 0 : 1;
5764 unsigned BitIdx = BitsPerElem * Lane;
5765 unsigned SrcLaneIdx = (ShuffleMask >> BitIdx) & IndexMask;
5766 unsigned ElemInLane = DstIdx % NumElemsPerLane;
5767 unsigned IdxToPick = SrcLaneIdx * NumElemsPerLane + ElemInLane;
5768 return std::pair<unsigned, int>{SrcIdx, IdxToPick};
5772 case X86::BI__builtin_ia32_insertf32x4_256:
5773 case X86::BI__builtin_ia32_inserti32x4_256:
5774 case X86::BI__builtin_ia32_insertf64x2_256:
5775 case X86::BI__builtin_ia32_inserti64x2_256:
5776 case X86::BI__builtin_ia32_insertf32x4:
5777 case X86::BI__builtin_ia32_inserti32x4:
5778 case X86::BI__builtin_ia32_insertf64x2_512:
5779 case X86::BI__builtin_ia32_inserti64x2_512:
5780 case X86::BI__builtin_ia32_insertf32x8:
5781 case X86::BI__builtin_ia32_inserti32x8:
5782 case X86::BI__builtin_ia32_insertf64x4:
5783 case X86::BI__builtin_ia32_inserti64x4:
5784 case X86::BI__builtin_ia32_vinsertf128_ps256:
5785 case X86::BI__builtin_ia32_vinsertf128_pd256:
5786 case X86::BI__builtin_ia32_vinsertf128_si256:
5787 case X86::BI__builtin_ia32_insert128i256:
5790 case clang::X86::BI__builtin_ia32_vcvtps2ph:
5791 case clang::X86::BI__builtin_ia32_vcvtps2ph256:
5794 case X86::BI__builtin_ia32_vec_ext_v4hi:
5795 case X86::BI__builtin_ia32_vec_ext_v16qi:
5796 case X86::BI__builtin_ia32_vec_ext_v8hi:
5797 case X86::BI__builtin_ia32_vec_ext_v4si:
5798 case X86::BI__builtin_ia32_vec_ext_v2di:
5799 case X86::BI__builtin_ia32_vec_ext_v32qi:
5800 case X86::BI__builtin_ia32_vec_ext_v16hi:
5801 case X86::BI__builtin_ia32_vec_ext_v8si:
5802 case X86::BI__builtin_ia32_vec_ext_v4di:
5803 case X86::BI__builtin_ia32_vec_ext_v4sf:
5806 case X86::BI__builtin_ia32_vec_set_v4hi:
5807 case X86::BI__builtin_ia32_vec_set_v16qi:
5808 case X86::BI__builtin_ia32_vec_set_v8hi:
5809 case X86::BI__builtin_ia32_vec_set_v4si:
5810 case X86::BI__builtin_ia32_vec_set_v2di:
5811 case X86::BI__builtin_ia32_vec_set_v32qi:
5812 case X86::BI__builtin_ia32_vec_set_v16hi:
5813 case X86::BI__builtin_ia32_vec_set_v8si:
5814 case X86::BI__builtin_ia32_vec_set_v4di:
5817 case X86::BI__builtin_ia32_cvtb2mask128:
5818 case X86::BI__builtin_ia32_cvtb2mask256:
5819 case X86::BI__builtin_ia32_cvtb2mask512:
5820 case X86::BI__builtin_ia32_cvtw2mask128:
5821 case X86::BI__builtin_ia32_cvtw2mask256:
5822 case X86::BI__builtin_ia32_cvtw2mask512:
5823 case X86::BI__builtin_ia32_cvtd2mask128:
5824 case X86::BI__builtin_ia32_cvtd2mask256:
5825 case X86::BI__builtin_ia32_cvtd2mask512:
5826 case X86::BI__builtin_ia32_cvtq2mask128:
5827 case X86::BI__builtin_ia32_cvtq2mask256:
5828 case X86::BI__builtin_ia32_cvtq2mask512:
5831 case X86::BI__builtin_ia32_cvtmask2b128:
5832 case X86::BI__builtin_ia32_cvtmask2b256:
5833 case X86::BI__builtin_ia32_cvtmask2b512:
5834 case X86::BI__builtin_ia32_cvtmask2w128:
5835 case X86::BI__builtin_ia32_cvtmask2w256:
5836 case X86::BI__builtin_ia32_cvtmask2w512:
5837 case X86::BI__builtin_ia32_cvtmask2d128:
5838 case X86::BI__builtin_ia32_cvtmask2d256:
5839 case X86::BI__builtin_ia32_cvtmask2d512:
5840 case X86::BI__builtin_ia32_cvtmask2q128:
5841 case X86::BI__builtin_ia32_cvtmask2q256:
5842 case X86::BI__builtin_ia32_cvtmask2q512:
5845 case X86::BI__builtin_ia32_cvtsd2ss:
5848 case X86::BI__builtin_ia32_cvtsd2ss_round_mask:
5851 case X86::BI__builtin_ia32_cvtpd2ps:
5852 case X86::BI__builtin_ia32_cvtpd2ps256:
5854 case X86::BI__builtin_ia32_cvtpd2ps_mask:
5856 case X86::BI__builtin_ia32_cvtpd2ps512_mask:
5859 case X86::BI__builtin_ia32_cmpb128_mask:
5860 case X86::BI__builtin_ia32_cmpw128_mask:
5861 case X86::BI__builtin_ia32_cmpd128_mask:
5862 case X86::BI__builtin_ia32_cmpq128_mask:
5863 case X86::BI__builtin_ia32_cmpb256_mask:
5864 case X86::BI__builtin_ia32_cmpw256_mask:
5865 case X86::BI__builtin_ia32_cmpd256_mask:
5866 case X86::BI__builtin_ia32_cmpq256_mask:
5867 case X86::BI__builtin_ia32_cmpb512_mask:
5868 case X86::BI__builtin_ia32_cmpw512_mask:
5869 case X86::BI__builtin_ia32_cmpd512_mask:
5870 case X86::BI__builtin_ia32_cmpq512_mask:
5874 case X86::BI__builtin_ia32_ucmpb128_mask:
5875 case X86::BI__builtin_ia32_ucmpw128_mask:
5876 case X86::BI__builtin_ia32_ucmpd128_mask:
5877 case X86::BI__builtin_ia32_ucmpq128_mask:
5878 case X86::BI__builtin_ia32_ucmpb256_mask:
5879 case X86::BI__builtin_ia32_ucmpw256_mask:
5880 case X86::BI__builtin_ia32_ucmpd256_mask:
5881 case X86::BI__builtin_ia32_ucmpq256_mask:
5882 case X86::BI__builtin_ia32_ucmpb512_mask:
5883 case X86::BI__builtin_ia32_ucmpw512_mask:
5884 case X86::BI__builtin_ia32_ucmpd512_mask:
5885 case X86::BI__builtin_ia32_ucmpq512_mask:
5889 case X86::BI__builtin_ia32_vpshufbitqmb128_mask:
5890 case X86::BI__builtin_ia32_vpshufbitqmb256_mask:
5891 case X86::BI__builtin_ia32_vpshufbitqmb512_mask:
5894 case X86::BI__builtin_ia32_pslldqi128_byteshift:
5895 case X86::BI__builtin_ia32_pslldqi256_byteshift:
5896 case X86::BI__builtin_ia32_pslldqi512_byteshift:
5903 [](
unsigned DstIdx,
unsigned Shift) -> std::pair<unsigned, int> {
5904 unsigned LaneBase = (DstIdx / 16) * 16;
5905 unsigned LaneIdx = DstIdx % 16;
5906 if (LaneIdx < Shift)
5907 return std::make_pair(0, -1);
5909 return std::make_pair(0,
5910 static_cast<int>(LaneBase + LaneIdx - Shift));
5913 case X86::BI__builtin_ia32_psrldqi128_byteshift:
5914 case X86::BI__builtin_ia32_psrldqi256_byteshift:
5915 case X86::BI__builtin_ia32_psrldqi512_byteshift:
5922 [](
unsigned DstIdx,
unsigned Shift) -> std::pair<unsigned, int> {
5923 unsigned LaneBase = (DstIdx / 16) * 16;
5924 unsigned LaneIdx = DstIdx % 16;
5925 if (LaneIdx + Shift < 16)
5926 return std::make_pair(0,
5927 static_cast<int>(LaneBase + LaneIdx + Shift));
5929 return std::make_pair(0, -1);
5932 case X86::BI__builtin_ia32_palignr128:
5933 case X86::BI__builtin_ia32_palignr256:
5934 case X86::BI__builtin_ia32_palignr512:
5936 S, OpPC,
Call, [](
unsigned DstIdx,
unsigned Shift) {
5938 unsigned VecIdx = 1;
5941 int Lane = DstIdx / 16;
5942 int Offset = DstIdx % 16;
5945 unsigned ShiftedIdx = Offset + (Shift & 0xFF);
5946 if (ShiftedIdx < 16) {
5947 ElemIdx = ShiftedIdx + (Lane * 16);
5948 }
else if (ShiftedIdx < 32) {
5950 ElemIdx = (ShiftedIdx - 16) + (Lane * 16);
5953 return std::pair<unsigned, int>{VecIdx, ElemIdx};
5956 case X86::BI__builtin_ia32_alignd128:
5957 case X86::BI__builtin_ia32_alignd256:
5958 case X86::BI__builtin_ia32_alignd512:
5959 case X86::BI__builtin_ia32_alignq128:
5960 case X86::BI__builtin_ia32_alignq256:
5961 case X86::BI__builtin_ia32_alignq512: {
5962 unsigned NumElems =
Call->getType()->castAs<
VectorType>()->getNumElements();
5964 S, OpPC,
Call, [NumElems](
unsigned DstIdx,
unsigned Shift) {
5965 unsigned Imm = Shift & 0xFF;
5966 unsigned EffectiveShift = Imm & (NumElems - 1);
5967 unsigned SourcePos = DstIdx + EffectiveShift;
5968 unsigned VecIdx = SourcePos < NumElems ? 1u : 0u;
5969 unsigned ElemIdx = SourcePos & (NumElems - 1);
5970 return std::pair<unsigned, int>{VecIdx,
static_cast<int>(ElemIdx)};
5974 case clang::X86::BI__builtin_ia32_minps:
5975 case clang::X86::BI__builtin_ia32_minpd:
5976 case clang::X86::BI__builtin_ia32_minph128:
5977 case clang::X86::BI__builtin_ia32_minph256:
5978 case clang::X86::BI__builtin_ia32_minps256:
5979 case clang::X86::BI__builtin_ia32_minpd256:
5980 case clang::X86::BI__builtin_ia32_minps512:
5981 case clang::X86::BI__builtin_ia32_minpd512:
5982 case clang::X86::BI__builtin_ia32_minph512:
5986 std::optional<APSInt>) -> std::optional<APFloat> {
5987 if (A.isNaN() || A.isInfinity() || A.isDenormal() || B.isNaN() ||
5988 B.isInfinity() || B.isDenormal())
5989 return std::nullopt;
5990 if (A.isZero() && B.isZero())
5992 return llvm::minimum(A, B);
5995 case clang::X86::BI__builtin_ia32_minss:
5996 case clang::X86::BI__builtin_ia32_minsd:
6000 std::optional<APSInt> RoundingMode) -> std::optional<APFloat> {
6005 case clang::X86::BI__builtin_ia32_minsd_round_mask:
6006 case clang::X86::BI__builtin_ia32_minss_round_mask:
6007 case clang::X86::BI__builtin_ia32_minsh_round_mask:
6008 case clang::X86::BI__builtin_ia32_maxsd_round_mask:
6009 case clang::X86::BI__builtin_ia32_maxss_round_mask:
6010 case clang::X86::BI__builtin_ia32_maxsh_round_mask: {
6011 bool IsMin = BuiltinID == clang::X86::BI__builtin_ia32_minsd_round_mask ||
6012 BuiltinID == clang::X86::BI__builtin_ia32_minss_round_mask ||
6013 BuiltinID == clang::X86::BI__builtin_ia32_minsh_round_mask;
6017 std::optional<APSInt> RoundingMode) -> std::optional<APFloat> {
6022 case clang::X86::BI__builtin_ia32_maxps:
6023 case clang::X86::BI__builtin_ia32_maxpd:
6024 case clang::X86::BI__builtin_ia32_maxph128:
6025 case clang::X86::BI__builtin_ia32_maxph256:
6026 case clang::X86::BI__builtin_ia32_maxps256:
6027 case clang::X86::BI__builtin_ia32_maxpd256:
6028 case clang::X86::BI__builtin_ia32_maxps512:
6029 case clang::X86::BI__builtin_ia32_maxpd512:
6030 case clang::X86::BI__builtin_ia32_maxph512:
6034 std::optional<APSInt>) -> std::optional<APFloat> {
6035 if (A.isNaN() || A.isInfinity() || A.isDenormal() || B.isNaN() ||
6036 B.isInfinity() || B.isDenormal())
6037 return std::nullopt;
6038 if (A.isZero() && B.isZero())
6040 return llvm::maximum(A, B);
6043 case clang::X86::BI__builtin_ia32_maxss:
6044 case clang::X86::BI__builtin_ia32_maxsd:
6048 std::optional<APSInt> RoundingMode) -> std::optional<APFloat> {
6055 diag::note_invalid_subexpr_in_const_expr)
6061 llvm_unreachable(
"Unhandled builtin ID");