521 llvm::AtomicOrdering AO = llvm::AtomicOrdering::SequentiallyConsistent;
522 llvm::SyncScope::ID SSID;
524 case AMDGPU::BI__builtin_amdgcn_wave_reduce_add_u32:
525 case AMDGPU::BI__builtin_amdgcn_wave_reduce_fadd_f32:
526 case AMDGPU::BI__builtin_amdgcn_wave_reduce_fadd_f64:
527 case AMDGPU::BI__builtin_amdgcn_wave_reduce_sub_u32:
528 case AMDGPU::BI__builtin_amdgcn_wave_reduce_fsub_f32:
529 case AMDGPU::BI__builtin_amdgcn_wave_reduce_fsub_f64:
530 case AMDGPU::BI__builtin_amdgcn_wave_reduce_min_i32:
531 case AMDGPU::BI__builtin_amdgcn_wave_reduce_min_u32:
532 case AMDGPU::BI__builtin_amdgcn_wave_reduce_fmin_f32:
533 case AMDGPU::BI__builtin_amdgcn_wave_reduce_fmin_f64:
534 case AMDGPU::BI__builtin_amdgcn_wave_reduce_max_i32:
535 case AMDGPU::BI__builtin_amdgcn_wave_reduce_max_u32:
536 case AMDGPU::BI__builtin_amdgcn_wave_reduce_fmax_f32:
537 case AMDGPU::BI__builtin_amdgcn_wave_reduce_fmax_f64:
538 case AMDGPU::BI__builtin_amdgcn_wave_reduce_and_b32:
539 case AMDGPU::BI__builtin_amdgcn_wave_reduce_or_b32:
540 case AMDGPU::BI__builtin_amdgcn_wave_reduce_xor_b32:
541 case AMDGPU::BI__builtin_amdgcn_wave_reduce_add_u64:
542 case AMDGPU::BI__builtin_amdgcn_wave_reduce_sub_u64:
543 case AMDGPU::BI__builtin_amdgcn_wave_reduce_min_i64:
544 case AMDGPU::BI__builtin_amdgcn_wave_reduce_min_u64:
545 case AMDGPU::BI__builtin_amdgcn_wave_reduce_max_i64:
546 case AMDGPU::BI__builtin_amdgcn_wave_reduce_max_u64:
547 case AMDGPU::BI__builtin_amdgcn_wave_reduce_and_b64:
548 case AMDGPU::BI__builtin_amdgcn_wave_reduce_or_b64:
549 case AMDGPU::BI__builtin_amdgcn_wave_reduce_xor_b64: {
556 case AMDGPU::BI__builtin_amdgcn_div_scale:
557 case AMDGPU::BI__builtin_amdgcn_div_scalef: {
567 llvm::Function *Callee =
CGM.getIntrinsic(Intrinsic::amdgcn_div_scale,
570 llvm::Value *Tmp =
Builder.CreateCall(Callee, {
X, Y, Z});
573 llvm::Value *Flag =
Builder.CreateExtractValue(Tmp, 1);
577 llvm::Value *FlagExt =
Builder.CreateZExt(Flag, RealFlagType);
578 Builder.CreateStore(FlagExt, FlagOutPtr);
581 case AMDGPU::BI__builtin_amdgcn_div_fmas:
582 case AMDGPU::BI__builtin_amdgcn_div_fmasf: {
588 llvm::Function *F =
CGM.getIntrinsic(Intrinsic::amdgcn_div_fmas,
590 llvm::Value *Src3ToBool =
Builder.CreateIsNotNull(Src3);
591 return Builder.CreateCall(F, {Src0, Src1, Src2, Src3ToBool});
594 case AMDGPU::BI__builtin_amdgcn_ds_swizzle:
596 Intrinsic::amdgcn_ds_swizzle);
597 case AMDGPU::BI__builtin_amdgcn_mov_dpp8:
598 case AMDGPU::BI__builtin_amdgcn_mov_dpp:
599 case AMDGPU::BI__builtin_amdgcn_update_dpp: {
603 unsigned ICEArguments = 0;
608 unsigned Size = DataTy->getPrimitiveSizeInBits();
610 llvm::IntegerType::get(
Builder.getContext(), std::max(Size, 32u));
612 CGM.getIntrinsic(BuiltinID == AMDGPU::BI__builtin_amdgcn_mov_dpp8
613 ? Intrinsic::amdgcn_mov_dpp8
614 : Intrinsic::amdgcn_update_dpp,
618 bool InsertOld = BuiltinID == AMDGPU::BI__builtin_amdgcn_mov_dpp;
620 Args.push_back(llvm::PoisonValue::get(
IntTy));
621 for (
unsigned I = 0; I != E->
getNumArgs(); ++I) {
623 if (I < (BuiltinID == AMDGPU::BI__builtin_amdgcn_update_dpp ? 2u : 1u) &&
625 if (!DataTy->isIntegerTy())
627 V, llvm::IntegerType::get(
Builder.getContext(), Size));
631 F->getFunctionType()->getFunctionParamType(I + InsertOld);
632 Args.push_back(
Builder.CreateTruncOrBitCast(
V, ExpTy));
635 if (Size < 32 && !DataTy->isIntegerTy())
637 V, llvm::IntegerType::get(
Builder.getContext(), Size));
638 return Builder.CreateTruncOrBitCast(
V, DataTy);
640 case AMDGPU::BI__builtin_amdgcn_permlane16:
641 case AMDGPU::BI__builtin_amdgcn_permlanex16:
644 BuiltinID == AMDGPU::BI__builtin_amdgcn_permlane16
645 ? Intrinsic::amdgcn_permlane16
646 : Intrinsic::amdgcn_permlanex16);
647 case AMDGPU::BI__builtin_amdgcn_permlane64:
649 Intrinsic::amdgcn_permlane64);
650 case AMDGPU::BI__builtin_amdgcn_readlane:
652 Intrinsic::amdgcn_readlane);
653 case AMDGPU::BI__builtin_amdgcn_wave_shuffle:
655 Intrinsic::amdgcn_wave_shuffle);
656 case AMDGPU::BI__builtin_amdgcn_readfirstlane:
658 Intrinsic::amdgcn_readfirstlane);
659 case AMDGPU::BI__builtin_amdgcn_div_fixup:
660 case AMDGPU::BI__builtin_amdgcn_div_fixupf:
661 case AMDGPU::BI__builtin_amdgcn_div_fixuph:
663 Intrinsic::amdgcn_div_fixup);
664 case AMDGPU::BI__builtin_amdgcn_trig_preop:
665 case AMDGPU::BI__builtin_amdgcn_trig_preopf:
667 case AMDGPU::BI__builtin_amdgcn_rcp:
668 case AMDGPU::BI__builtin_amdgcn_rcpf:
669 case AMDGPU::BI__builtin_amdgcn_rcph:
670 case AMDGPU::BI__builtin_amdgcn_rcp_bf16:
672 case AMDGPU::BI__builtin_amdgcn_sqrt:
673 case AMDGPU::BI__builtin_amdgcn_sqrtf:
674 case AMDGPU::BI__builtin_amdgcn_sqrth:
675 case AMDGPU::BI__builtin_amdgcn_sqrt_bf16:
677 Intrinsic::amdgcn_sqrt);
678 case AMDGPU::BI__builtin_amdgcn_rsq:
679 case AMDGPU::BI__builtin_amdgcn_rsqf:
680 case AMDGPU::BI__builtin_amdgcn_rsqh:
681 case AMDGPU::BI__builtin_amdgcn_rsq_bf16:
683 case AMDGPU::BI__builtin_amdgcn_rsq_clamp:
684 case AMDGPU::BI__builtin_amdgcn_rsq_clampf:
686 Intrinsic::amdgcn_rsq_clamp);
687 case AMDGPU::BI__builtin_amdgcn_sinf:
688 case AMDGPU::BI__builtin_amdgcn_sinh:
689 case AMDGPU::BI__builtin_amdgcn_sin_bf16:
691 case AMDGPU::BI__builtin_amdgcn_cosf:
692 case AMDGPU::BI__builtin_amdgcn_cosh:
693 case AMDGPU::BI__builtin_amdgcn_cos_bf16:
695 case AMDGPU::BI__builtin_amdgcn_dispatch_ptr:
696 return EmitAMDGPUDispatchPtr(*
this, E);
697 case AMDGPU::BI__builtin_amdgcn_logf:
698 case AMDGPU::BI__builtin_amdgcn_log_bf16:
700 case AMDGPU::BI__builtin_amdgcn_exp2f:
701 case AMDGPU::BI__builtin_amdgcn_exp2_bf16:
703 Intrinsic::amdgcn_exp2);
704 case AMDGPU::BI__builtin_amdgcn_log_clampf:
706 Intrinsic::amdgcn_log_clamp);
707 case AMDGPU::BI__builtin_amdgcn_ldexp:
708 case AMDGPU::BI__builtin_amdgcn_ldexpf: {
712 CGM.getIntrinsic(Intrinsic::ldexp, {Src0->getType(), Src1->getType()});
713 return Builder.CreateCall(F, {Src0, Src1});
715 case AMDGPU::BI__builtin_amdgcn_ldexph: {
721 CGM.getIntrinsic(Intrinsic::ldexp, {Src0->getType(),
Int16Ty});
724 case AMDGPU::BI__builtin_amdgcn_frexp_mant:
725 case AMDGPU::BI__builtin_amdgcn_frexp_mantf:
726 case AMDGPU::BI__builtin_amdgcn_frexp_manth:
728 Intrinsic::amdgcn_frexp_mant);
729 case AMDGPU::BI__builtin_amdgcn_frexp_exp:
730 case AMDGPU::BI__builtin_amdgcn_frexp_expf: {
732 Function *F =
CGM.getIntrinsic(Intrinsic::amdgcn_frexp_exp,
734 return Builder.CreateCall(F, Src0);
736 case AMDGPU::BI__builtin_amdgcn_frexp_exph: {
738 Function *F =
CGM.getIntrinsic(Intrinsic::amdgcn_frexp_exp,
740 return Builder.CreateCall(F, Src0);
742 case AMDGPU::BI__builtin_amdgcn_fract:
743 case AMDGPU::BI__builtin_amdgcn_fractf:
744 case AMDGPU::BI__builtin_amdgcn_fracth:
746 Intrinsic::amdgcn_fract);
747 case AMDGPU::BI__builtin_amdgcn_lerp:
749 Intrinsic::amdgcn_lerp);
750 case AMDGPU::BI__builtin_amdgcn_ubfe:
752 Intrinsic::amdgcn_ubfe);
753 case AMDGPU::BI__builtin_amdgcn_sbfe:
755 Intrinsic::amdgcn_sbfe);
756 case AMDGPU::BI__builtin_amdgcn_ballot_w32:
757 case AMDGPU::BI__builtin_amdgcn_ballot_w64: {
760 Function *F =
CGM.getIntrinsic(Intrinsic::amdgcn_ballot, {ResultType});
761 return Builder.CreateCall(F, {Src});
763 case AMDGPU::BI__builtin_amdgcn_inverse_ballot_w32:
764 case AMDGPU::BI__builtin_amdgcn_inverse_ballot_w64: {
767 CGM.getIntrinsic(Intrinsic::amdgcn_inverse_ballot, {Src->getType()});
768 return Builder.CreateCall(F, {Src});
770 case AMDGPU::BI__builtin_amdgcn_tanhf:
771 case AMDGPU::BI__builtin_amdgcn_tanhh:
772 case AMDGPU::BI__builtin_amdgcn_tanh_bf16:
774 Intrinsic::amdgcn_tanh);
775 case AMDGPU::BI__builtin_amdgcn_uicmp:
776 case AMDGPU::BI__builtin_amdgcn_uicmpl:
777 case AMDGPU::BI__builtin_amdgcn_sicmp:
778 case AMDGPU::BI__builtin_amdgcn_sicmpl: {
784 Function *F =
CGM.getIntrinsic(Intrinsic::amdgcn_icmp,
785 {
Builder.getInt64Ty(), Src0->getType() });
786 return Builder.CreateCall(F, { Src0, Src1, Src2 });
788 case AMDGPU::BI__builtin_amdgcn_fcmp:
789 case AMDGPU::BI__builtin_amdgcn_fcmpf: {
795 Function *F =
CGM.getIntrinsic(Intrinsic::amdgcn_fcmp,
796 {
Builder.getInt64Ty(), Src0->getType() });
797 return Builder.CreateCall(F, { Src0, Src1, Src2 });
799 case AMDGPU::BI__builtin_amdgcn_class:
800 case AMDGPU::BI__builtin_amdgcn_classf:
801 case AMDGPU::BI__builtin_amdgcn_classh:
803 case AMDGPU::BI__builtin_amdgcn_fmed3f:
804 case AMDGPU::BI__builtin_amdgcn_fmed3h:
806 Intrinsic::amdgcn_fmed3);
807 case AMDGPU::BI__builtin_amdgcn_ds_append:
808 case AMDGPU::BI__builtin_amdgcn_ds_consume: {
809 Intrinsic::ID Intrin = BuiltinID == AMDGPU::BI__builtin_amdgcn_ds_append ?
810 Intrinsic::amdgcn_ds_append : Intrinsic::amdgcn_ds_consume;
815 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b64_i32:
816 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b64_v2i32:
817 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b128_v4i16:
818 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b128_v4f16:
819 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b128_v4bf16:
820 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b128_v8i16:
821 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b128_v8f16:
822 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b128_v8bf16:
823 case AMDGPU::BI__builtin_amdgcn_global_load_tr4_b64_v2i32:
824 case AMDGPU::BI__builtin_amdgcn_global_load_tr8_b64_v2i32:
825 case AMDGPU::BI__builtin_amdgcn_global_load_tr6_b96_v3i32:
826 case AMDGPU::BI__builtin_amdgcn_global_load_tr16_b128_v8i16:
827 case AMDGPU::BI__builtin_amdgcn_global_load_tr16_b128_v8f16:
828 case AMDGPU::BI__builtin_amdgcn_global_load_tr16_b128_v8bf16:
829 case AMDGPU::BI__builtin_amdgcn_ds_load_tr4_b64_v2i32:
830 case AMDGPU::BI__builtin_amdgcn_ds_load_tr8_b64_v2i32:
831 case AMDGPU::BI__builtin_amdgcn_ds_load_tr6_b96_v3i32:
832 case AMDGPU::BI__builtin_amdgcn_ds_load_tr16_b128_v8i16:
833 case AMDGPU::BI__builtin_amdgcn_ds_load_tr16_b128_v8f16:
834 case AMDGPU::BI__builtin_amdgcn_ds_load_tr16_b128_v8bf16:
835 case AMDGPU::BI__builtin_amdgcn_ds_read_tr4_b64_v2i32:
836 case AMDGPU::BI__builtin_amdgcn_ds_read_tr8_b64_v2i32:
837 case AMDGPU::BI__builtin_amdgcn_ds_read_tr6_b96_v3i32:
838 case AMDGPU::BI__builtin_amdgcn_ds_read_tr16_b64_v4f16:
839 case AMDGPU::BI__builtin_amdgcn_ds_read_tr16_b64_v4bf16:
840 case AMDGPU::BI__builtin_amdgcn_ds_read_tr16_b64_v4i16: {
843 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b64_i32:
844 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b64_v2i32:
845 case AMDGPU::BI__builtin_amdgcn_global_load_tr8_b64_v2i32:
846 IID = Intrinsic::amdgcn_global_load_tr_b64;
848 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b128_v4i16:
849 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b128_v4f16:
850 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b128_v4bf16:
851 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b128_v8i16:
852 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b128_v8f16:
853 case AMDGPU::BI__builtin_amdgcn_global_load_tr_b128_v8bf16:
854 case AMDGPU::BI__builtin_amdgcn_global_load_tr16_b128_v8i16:
855 case AMDGPU::BI__builtin_amdgcn_global_load_tr16_b128_v8f16:
856 case AMDGPU::BI__builtin_amdgcn_global_load_tr16_b128_v8bf16:
857 IID = Intrinsic::amdgcn_global_load_tr_b128;
859 case AMDGPU::BI__builtin_amdgcn_global_load_tr4_b64_v2i32:
860 IID = Intrinsic::amdgcn_global_load_tr4_b64;
862 case AMDGPU::BI__builtin_amdgcn_global_load_tr6_b96_v3i32:
863 IID = Intrinsic::amdgcn_global_load_tr6_b96;
865 case AMDGPU::BI__builtin_amdgcn_ds_load_tr4_b64_v2i32:
866 IID = Intrinsic::amdgcn_ds_load_tr4_b64;
868 case AMDGPU::BI__builtin_amdgcn_ds_load_tr6_b96_v3i32:
869 IID = Intrinsic::amdgcn_ds_load_tr6_b96;
871 case AMDGPU::BI__builtin_amdgcn_ds_load_tr8_b64_v2i32:
872 IID = Intrinsic::amdgcn_ds_load_tr8_b64;
874 case AMDGPU::BI__builtin_amdgcn_ds_load_tr16_b128_v8i16:
875 case AMDGPU::BI__builtin_amdgcn_ds_load_tr16_b128_v8f16:
876 case AMDGPU::BI__builtin_amdgcn_ds_load_tr16_b128_v8bf16:
877 IID = Intrinsic::amdgcn_ds_load_tr16_b128;
879 case AMDGPU::BI__builtin_amdgcn_ds_read_tr4_b64_v2i32:
880 IID = Intrinsic::amdgcn_ds_read_tr4_b64;
882 case AMDGPU::BI__builtin_amdgcn_ds_read_tr8_b64_v2i32:
883 IID = Intrinsic::amdgcn_ds_read_tr8_b64;
885 case AMDGPU::BI__builtin_amdgcn_ds_read_tr6_b96_v3i32:
886 IID = Intrinsic::amdgcn_ds_read_tr6_b96;
888 case AMDGPU::BI__builtin_amdgcn_ds_read_tr16_b64_v4i16:
889 case AMDGPU::BI__builtin_amdgcn_ds_read_tr16_b64_v4f16:
890 case AMDGPU::BI__builtin_amdgcn_ds_read_tr16_b64_v4bf16:
891 IID = Intrinsic::amdgcn_ds_read_tr16_b64;
896 llvm::Function *F =
CGM.getIntrinsic(IID, {LoadTy});
899 case AMDGPU::BI__builtin_amdgcn_global_load_monitor_b32:
900 case AMDGPU::BI__builtin_amdgcn_global_load_monitor_b64:
901 case AMDGPU::BI__builtin_amdgcn_global_load_monitor_b128:
902 case AMDGPU::BI__builtin_amdgcn_flat_load_monitor_b32:
903 case AMDGPU::BI__builtin_amdgcn_flat_load_monitor_b64:
904 case AMDGPU::BI__builtin_amdgcn_flat_load_monitor_b128: {
908 case AMDGPU::BI__builtin_amdgcn_global_load_monitor_b32:
909 IID = Intrinsic::amdgcn_global_load_monitor_b32;
911 case AMDGPU::BI__builtin_amdgcn_global_load_monitor_b64:
912 IID = Intrinsic::amdgcn_global_load_monitor_b64;
914 case AMDGPU::BI__builtin_amdgcn_global_load_monitor_b128:
915 IID = Intrinsic::amdgcn_global_load_monitor_b128;
917 case AMDGPU::BI__builtin_amdgcn_flat_load_monitor_b32:
918 IID = Intrinsic::amdgcn_flat_load_monitor_b32;
920 case AMDGPU::BI__builtin_amdgcn_flat_load_monitor_b64:
921 IID = Intrinsic::amdgcn_flat_load_monitor_b64;
923 case AMDGPU::BI__builtin_amdgcn_flat_load_monitor_b128:
924 IID = Intrinsic::amdgcn_flat_load_monitor_b128;
935 llvm::Value *ScopeMD =
emitScopeMD(*
this, ScopeExpr->getZExtValue(), AO);
936 llvm::Function *F =
CGM.getIntrinsic(IID, {LoadTy});
937 return Builder.CreateCall(F, {
Addr, AOExpr, ScopeMD});
939 case AMDGPU::BI__builtin_amdgcn_cluster_load_b32:
940 case AMDGPU::BI__builtin_amdgcn_cluster_load_b64:
941 case AMDGPU::BI__builtin_amdgcn_cluster_load_b128: {
944 case AMDGPU::BI__builtin_amdgcn_cluster_load_b32:
945 IID = Intrinsic::amdgcn_cluster_load_b32;
947 case AMDGPU::BI__builtin_amdgcn_cluster_load_b64:
948 IID = Intrinsic::amdgcn_cluster_load_b64;
950 case AMDGPU::BI__builtin_amdgcn_cluster_load_b128:
951 IID = Intrinsic::amdgcn_cluster_load_b128;
955 for (
int i = 0, e = E->
getNumArgs(); i != e; ++i)
958 return Builder.CreateCall(F, {Args});
960 case AMDGPU::BI__builtin_amdgcn_load_to_lds: {
963 Intrinsic::amdgcn_load_to_lds);
965 case AMDGPU::BI__builtin_amdgcn_load_async_to_lds: {
968 *
this, E, Intrinsic::amdgcn_load_async_to_lds);
970 case AMDGPU::BI__builtin_amdgcn_cooperative_atomic_load_32x4B:
971 case AMDGPU::BI__builtin_amdgcn_cooperative_atomic_store_32x4B:
972 case AMDGPU::BI__builtin_amdgcn_cooperative_atomic_load_16x8B:
973 case AMDGPU::BI__builtin_amdgcn_cooperative_atomic_store_16x8B:
974 case AMDGPU::BI__builtin_amdgcn_cooperative_atomic_load_8x16B:
975 case AMDGPU::BI__builtin_amdgcn_cooperative_atomic_store_8x16B: {
978 case AMDGPU::BI__builtin_amdgcn_cooperative_atomic_load_32x4B:
979 IID = Intrinsic::amdgcn_cooperative_atomic_load_32x4B;
981 case AMDGPU::BI__builtin_amdgcn_cooperative_atomic_store_32x4B:
982 IID = Intrinsic::amdgcn_cooperative_atomic_store_32x4B;
984 case AMDGPU::BI__builtin_amdgcn_cooperative_atomic_load_16x8B:
985 IID = Intrinsic::amdgcn_cooperative_atomic_load_16x8B;
987 case AMDGPU::BI__builtin_amdgcn_cooperative_atomic_store_16x8B:
988 IID = Intrinsic::amdgcn_cooperative_atomic_store_16x8B;
990 case AMDGPU::BI__builtin_amdgcn_cooperative_atomic_load_8x16B:
991 IID = Intrinsic::amdgcn_cooperative_atomic_load_8x16B;
993 case AMDGPU::BI__builtin_amdgcn_cooperative_atomic_store_8x16B:
994 IID = Intrinsic::amdgcn_cooperative_atomic_store_8x16B;
998 LLVMContext &Ctx =
CGM.getLLVMContext();
1001 const unsigned ScopeArg = E->
getNumArgs() - 1;
1002 for (
unsigned i = 0; i != ScopeArg; ++i)
1006 llvm::MDNode *MD = llvm::MDNode::get(Ctx, {llvm::MDString::get(Ctx, Arg)});
1007 Args.push_back(llvm::MetadataAsValue::get(Ctx, MD));
1010 llvm::Function *F =
CGM.getIntrinsic(IID, {Args[0]->getType()});
1011 return Builder.CreateCall(F, {Args});
1013 case AMDGPU::BI__builtin_amdgcn_av_load_b128:
1014 case AMDGPU::BI__builtin_amdgcn_av_store_b128: {
1015 const bool IsStore = BuiltinID == AMDGPU::BI__builtin_amdgcn_av_store_b128;
1019 const unsigned ScopeIdx = E->
getNumArgs() - 1;
1022 Args.push_back(
emitScopeMD(*
this, ScopeExpr->getZExtValue()));
1024 CGM.getIntrinsic(IsStore ? Intrinsic::amdgcn_av_store_b128
1025 : Intrinsic::amdgcn_av_load_b128,
1026 {Args[0]->getType()});
1027 return Builder.CreateCall(F, Args);
1029 case AMDGPU::BI__builtin_amdgcn_get_fpenv: {
1030 Function *F =
CGM.getIntrinsic(Intrinsic::get_fpenv,
1034 case AMDGPU::BI__builtin_amdgcn_set_fpenv: {
1035 Function *F =
CGM.getIntrinsic(Intrinsic::set_fpenv,
1038 return Builder.CreateCall(F, {Env});
1040 case AMDGPU::BI__builtin_amdgcn_processor_is: {
1041 assert(
CGM.getTriple().isSPIRV() &&
1042 "__builtin_amdgcn_processor_is should never reach CodeGen for "
1043 "concrete targets!");
1047 case AMDGPU::BI__builtin_amdgcn_is_invocable: {
1048 assert(
CGM.getTriple().isSPIRV() &&
1049 "__builtin_amdgcn_is_invocable should never reach CodeGen for "
1050 "concrete targets!");
1057 case AMDGPU::BI__builtin_amdgcn_read_exec:
1059 case AMDGPU::BI__builtin_amdgcn_read_exec_lo:
1061 case AMDGPU::BI__builtin_amdgcn_read_exec_hi:
1063 case AMDGPU::BI__builtin_amdgcn_image_bvh_intersect_ray:
1064 case AMDGPU::BI__builtin_amdgcn_image_bvh_intersect_ray_h:
1065 case AMDGPU::BI__builtin_amdgcn_image_bvh_intersect_ray_l:
1066 case AMDGPU::BI__builtin_amdgcn_image_bvh_intersect_ray_lh: {
1076 RayOrigin =
Builder.CreateShuffleVector(RayOrigin, RayOrigin,
1079 Builder.CreateShuffleVector(RayDir, RayDir, {0, 1, 2});
1080 RayInverseDir =
Builder.CreateShuffleVector(RayInverseDir, RayInverseDir,
1083 Function *F =
CGM.getIntrinsic(Intrinsic::amdgcn_image_bvh_intersect_ray,
1084 {NodePtr->getType(), RayDir->getType()});
1085 return Builder.CreateCall(F, {NodePtr, RayExtent, RayOrigin, RayDir,
1086 RayInverseDir, TextureDescr});
1088 case AMDGPU::BI__builtin_amdgcn_image_bvh8_intersect_ray:
1089 case AMDGPU::BI__builtin_amdgcn_image_bvh_dual_intersect_ray: {
1091 switch (BuiltinID) {
1092 case AMDGPU::BI__builtin_amdgcn_image_bvh8_intersect_ray:
1093 IID = Intrinsic::amdgcn_image_bvh8_intersect_ray;
1095 case AMDGPU::BI__builtin_amdgcn_image_bvh_dual_intersect_ray:
1096 IID = Intrinsic::amdgcn_image_bvh_dual_intersect_ray;
1110 llvm::Function *IntrinsicFunc =
CGM.getIntrinsic(IID);
1112 llvm::CallInst *CI =
Builder.CreateCall(
1113 IntrinsicFunc, {NodePtr, RayExtent, InstanceMask, RayOrigin, RayDir,
1114 Offset, TextureDescr});
1116 llvm::Value *RetVData =
Builder.CreateExtractValue(CI, 0);
1117 llvm::Value *RetRayOrigin =
Builder.CreateExtractValue(CI, 1);
1118 llvm::Value *RetRayDir =
Builder.CreateExtractValue(CI, 2);
1120 Builder.CreateStore(RetRayOrigin, RetRayOriginPtr);
1121 Builder.CreateStore(RetRayDir, RetRayDirPtr);
1126 case AMDGPU::BI__builtin_amdgcn_ds_bvh_stack_rtn:
1127 case AMDGPU::BI__builtin_amdgcn_ds_bvh_stack_push4_pop1_rtn:
1128 case AMDGPU::BI__builtin_amdgcn_ds_bvh_stack_push8_pop1_rtn:
1129 case AMDGPU::BI__builtin_amdgcn_ds_bvh_stack_push8_pop2_rtn: {
1131 switch (BuiltinID) {
1132 case AMDGPU::BI__builtin_amdgcn_ds_bvh_stack_rtn:
1133 IID = Intrinsic::amdgcn_ds_bvh_stack_rtn;
1135 case AMDGPU::BI__builtin_amdgcn_ds_bvh_stack_push4_pop1_rtn:
1136 IID = Intrinsic::amdgcn_ds_bvh_stack_push4_pop1_rtn;
1138 case AMDGPU::BI__builtin_amdgcn_ds_bvh_stack_push8_pop1_rtn:
1139 IID = Intrinsic::amdgcn_ds_bvh_stack_push8_pop1_rtn;
1141 case AMDGPU::BI__builtin_amdgcn_ds_bvh_stack_push8_pop2_rtn:
1142 IID = Intrinsic::amdgcn_ds_bvh_stack_push8_pop2_rtn;
1147 for (
int i = 0, e = E->
getNumArgs(); i != e; ++i)
1155 Value *I0 =
Builder.CreateInsertElement(PoisonValue::get(RetTy), Rtn,
1159 if (A->
getType()->getPrimitiveSizeInBits() <
1160 RetTy->getScalarType()->getPrimitiveSizeInBits())
1161 A =
Builder.CreateZExt(A, RetTy->getScalarType());
1163 return Builder.CreateInsertElement(I0, A, 1);
1165 case AMDGPU::BI__builtin_amdgcn_image_load_1d_v4f32_i32:
1166 case AMDGPU::BI__builtin_amdgcn_image_load_1d_v4f16_i32:
1168 *
this, E, Intrinsic::amdgcn_image_load_1d,
false);
1169 case AMDGPU::BI__builtin_amdgcn_image_load_1darray_v4f32_i32:
1170 case AMDGPU::BI__builtin_amdgcn_image_load_1darray_v4f16_i32:
1172 *
this, E, Intrinsic::amdgcn_image_load_1darray,
false);
1173 case AMDGPU::BI__builtin_amdgcn_image_load_2d_f32_i32:
1174 case AMDGPU::BI__builtin_amdgcn_image_load_2d_v4f32_i32:
1175 case AMDGPU::BI__builtin_amdgcn_image_load_2d_v4f16_i32:
1177 *
this, E, Intrinsic::amdgcn_image_load_2d,
false);
1178 case AMDGPU::BI__builtin_amdgcn_image_load_2darray_f32_i32:
1179 case AMDGPU::BI__builtin_amdgcn_image_load_2darray_v4f32_i32:
1180 case AMDGPU::BI__builtin_amdgcn_image_load_2darray_v4f16_i32:
1182 *
this, E, Intrinsic::amdgcn_image_load_2darray,
false);
1183 case AMDGPU::BI__builtin_amdgcn_image_load_3d_v4f32_i32:
1184 case AMDGPU::BI__builtin_amdgcn_image_load_3d_v4f16_i32:
1186 *
this, E, Intrinsic::amdgcn_image_load_3d,
false);
1187 case AMDGPU::BI__builtin_amdgcn_image_load_cube_v4f32_i32:
1188 case AMDGPU::BI__builtin_amdgcn_image_load_cube_v4f16_i32:
1190 *
this, E, Intrinsic::amdgcn_image_load_cube,
false);
1191 case AMDGPU::BI__builtin_amdgcn_image_load_mip_1d_v4f32_i32:
1192 case AMDGPU::BI__builtin_amdgcn_image_load_mip_1d_v4f16_i32:
1194 *
this, E, Intrinsic::amdgcn_image_load_mip_1d,
false);
1195 case AMDGPU::BI__builtin_amdgcn_image_load_mip_1darray_v4f32_i32:
1196 case AMDGPU::BI__builtin_amdgcn_image_load_mip_1darray_v4f16_i32:
1198 *
this, E, Intrinsic::amdgcn_image_load_mip_1darray,
false);
1199 case AMDGPU::BI__builtin_amdgcn_image_load_mip_2d_f32_i32:
1200 case AMDGPU::BI__builtin_amdgcn_image_load_mip_2d_v4f32_i32:
1201 case AMDGPU::BI__builtin_amdgcn_image_load_mip_2d_v4f16_i32:
1203 *
this, E, Intrinsic::amdgcn_image_load_mip_2d,
false);
1204 case AMDGPU::BI__builtin_amdgcn_image_load_mip_2darray_f32_i32:
1205 case AMDGPU::BI__builtin_amdgcn_image_load_mip_2darray_v4f32_i32:
1206 case AMDGPU::BI__builtin_amdgcn_image_load_mip_2darray_v4f16_i32:
1208 *
this, E, Intrinsic::amdgcn_image_load_mip_2darray,
false);
1209 case AMDGPU::BI__builtin_amdgcn_image_load_mip_3d_v4f32_i32:
1210 case AMDGPU::BI__builtin_amdgcn_image_load_mip_3d_v4f16_i32:
1212 *
this, E, Intrinsic::amdgcn_image_load_mip_3d,
false);
1213 case AMDGPU::BI__builtin_amdgcn_image_load_mip_cube_v4f32_i32:
1214 case AMDGPU::BI__builtin_amdgcn_image_load_mip_cube_v4f16_i32:
1216 *
this, E, Intrinsic::amdgcn_image_load_mip_cube,
false);
1217 case AMDGPU::BI__builtin_amdgcn_image_store_1d_v4f32_i32:
1218 case AMDGPU::BI__builtin_amdgcn_image_store_1d_v4f16_i32:
1220 *
this, E, Intrinsic::amdgcn_image_store_1d,
true);
1221 case AMDGPU::BI__builtin_amdgcn_image_store_1darray_v4f32_i32:
1222 case AMDGPU::BI__builtin_amdgcn_image_store_1darray_v4f16_i32:
1224 *
this, E, Intrinsic::amdgcn_image_store_1darray,
true);
1225 case AMDGPU::BI__builtin_amdgcn_image_store_2d_f32_i32:
1226 case AMDGPU::BI__builtin_amdgcn_image_store_2d_v4f32_i32:
1227 case AMDGPU::BI__builtin_amdgcn_image_store_2d_v4f16_i32:
1229 *
this, E, Intrinsic::amdgcn_image_store_2d,
true);
1230 case AMDGPU::BI__builtin_amdgcn_image_store_2darray_f32_i32:
1231 case AMDGPU::BI__builtin_amdgcn_image_store_2darray_v4f32_i32:
1232 case AMDGPU::BI__builtin_amdgcn_image_store_2darray_v4f16_i32:
1234 *
this, E, Intrinsic::amdgcn_image_store_2darray,
true);
1235 case AMDGPU::BI__builtin_amdgcn_image_store_3d_v4f32_i32:
1236 case AMDGPU::BI__builtin_amdgcn_image_store_3d_v4f16_i32:
1238 *
this, E, Intrinsic::amdgcn_image_store_3d,
true);
1239 case AMDGPU::BI__builtin_amdgcn_image_store_cube_v4f32_i32:
1240 case AMDGPU::BI__builtin_amdgcn_image_store_cube_v4f16_i32:
1242 *
this, E, Intrinsic::amdgcn_image_store_cube,
true);
1243 case AMDGPU::BI__builtin_amdgcn_image_store_mip_1d_v4f32_i32:
1244 case AMDGPU::BI__builtin_amdgcn_image_store_mip_1d_v4f16_i32:
1246 *
this, E, Intrinsic::amdgcn_image_store_mip_1d,
true);
1247 case AMDGPU::BI__builtin_amdgcn_image_store_mip_1darray_v4f32_i32:
1248 case AMDGPU::BI__builtin_amdgcn_image_store_mip_1darray_v4f16_i32:
1250 *
this, E, Intrinsic::amdgcn_image_store_mip_1darray,
true);
1251 case AMDGPU::BI__builtin_amdgcn_image_store_mip_2d_f32_i32:
1252 case AMDGPU::BI__builtin_amdgcn_image_store_mip_2d_v4f32_i32:
1253 case AMDGPU::BI__builtin_amdgcn_image_store_mip_2d_v4f16_i32:
1255 *
this, E, Intrinsic::amdgcn_image_store_mip_2d,
true);
1256 case AMDGPU::BI__builtin_amdgcn_image_store_mip_2darray_f32_i32:
1257 case AMDGPU::BI__builtin_amdgcn_image_store_mip_2darray_v4f32_i32:
1258 case AMDGPU::BI__builtin_amdgcn_image_store_mip_2darray_v4f16_i32:
1260 *
this, E, Intrinsic::amdgcn_image_store_mip_2darray,
true);
1261 case AMDGPU::BI__builtin_amdgcn_image_store_mip_3d_v4f32_i32:
1262 case AMDGPU::BI__builtin_amdgcn_image_store_mip_3d_v4f16_i32:
1264 *
this, E, Intrinsic::amdgcn_image_store_mip_3d,
true);
1265 case AMDGPU::BI__builtin_amdgcn_image_store_mip_cube_v4f32_i32:
1266 case AMDGPU::BI__builtin_amdgcn_image_store_mip_cube_v4f16_i32:
1268 *
this, E, Intrinsic::amdgcn_image_store_mip_cube,
true);
1269 case AMDGPU::BI__builtin_amdgcn_image_sample_1d_v4f32_f32:
1270 case AMDGPU::BI__builtin_amdgcn_image_sample_1d_v4f16_f32:
1272 *
this, E, Intrinsic::amdgcn_image_sample_1d,
false);
1273 case AMDGPU::BI__builtin_amdgcn_image_sample_1darray_v4f32_f32:
1274 case AMDGPU::BI__builtin_amdgcn_image_sample_1darray_v4f16_f32:
1276 *
this, E, Intrinsic::amdgcn_image_sample_1darray,
false);
1277 case AMDGPU::BI__builtin_amdgcn_image_sample_2d_f32_f32:
1278 case AMDGPU::BI__builtin_amdgcn_image_sample_2d_v4f32_f32:
1279 case AMDGPU::BI__builtin_amdgcn_image_sample_2d_v4f16_f32:
1281 *
this, E, Intrinsic::amdgcn_image_sample_2d,
false);
1282 case AMDGPU::BI__builtin_amdgcn_image_sample_2darray_f32_f32:
1283 case AMDGPU::BI__builtin_amdgcn_image_sample_2darray_v4f32_f32:
1284 case AMDGPU::BI__builtin_amdgcn_image_sample_2darray_v4f16_f32:
1286 *
this, E, Intrinsic::amdgcn_image_sample_2darray,
false);
1287 case AMDGPU::BI__builtin_amdgcn_image_sample_3d_v4f32_f32:
1288 case AMDGPU::BI__builtin_amdgcn_image_sample_3d_v4f16_f32:
1290 *
this, E, Intrinsic::amdgcn_image_sample_3d,
false);
1291 case AMDGPU::BI__builtin_amdgcn_image_sample_cube_v4f32_f32:
1292 case AMDGPU::BI__builtin_amdgcn_image_sample_cube_v4f16_f32:
1294 *
this, E, Intrinsic::amdgcn_image_sample_cube,
false);
1295 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_lz_1d_v4f32_f32:
1296 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_lz_1d_v4f16_f32:
1298 *
this, E, Intrinsic::amdgcn_image_sample_lz_1d,
false);
1299 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_l_1d_v4f32_f32:
1300 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_l_1d_v4f16_f32:
1302 *
this, E, Intrinsic::amdgcn_image_sample_l_1d,
false);
1303 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_d_1d_v4f32_f32:
1304 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_d_1d_v4f16_f32:
1306 *
this, E, Intrinsic::amdgcn_image_sample_d_1d,
false);
1307 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_lz_2d_v4f32_f32:
1308 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_lz_2d_v4f16_f32:
1309 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_lz_2d_f32_f32:
1311 *
this, E, Intrinsic::amdgcn_image_sample_lz_2d,
false);
1312 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_l_2d_v4f32_f32:
1313 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_l_2d_v4f16_f32:
1314 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_l_2d_f32_f32:
1316 *
this, E, Intrinsic::amdgcn_image_sample_l_2d,
false);
1317 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_d_2d_v4f32_f32:
1318 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_d_2d_v4f16_f32:
1319 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_d_2d_f32_f32:
1321 *
this, E, Intrinsic::amdgcn_image_sample_d_2d,
false);
1322 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_lz_3d_v4f32_f32:
1323 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_lz_3d_v4f16_f32:
1325 *
this, E, Intrinsic::amdgcn_image_sample_lz_3d,
false);
1326 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_l_3d_v4f32_f32:
1327 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_l_3d_v4f16_f32:
1329 *
this, E, Intrinsic::amdgcn_image_sample_l_3d,
false);
1330 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_d_3d_v4f32_f32:
1331 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_d_3d_v4f16_f32:
1333 *
this, E, Intrinsic::amdgcn_image_sample_d_3d,
false);
1334 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_lz_cube_v4f32_f32:
1335 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_lz_cube_v4f16_f32:
1337 *
this, E, Intrinsic::amdgcn_image_sample_lz_cube,
false);
1338 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_l_cube_v4f32_f32:
1339 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_l_cube_v4f16_f32:
1341 *
this, E, Intrinsic::amdgcn_image_sample_l_cube,
false);
1342 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_lz_1darray_v4f32_f32:
1343 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_lz_1darray_v4f16_f32:
1345 *
this, E, Intrinsic::amdgcn_image_sample_lz_1darray,
false);
1346 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_l_1darray_v4f32_f32:
1347 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_l_1darray_v4f16_f32:
1349 *
this, E, Intrinsic::amdgcn_image_sample_l_1darray,
false);
1350 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_d_1darray_v4f32_f32:
1351 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_d_1darray_v4f16_f32:
1353 *
this, E, Intrinsic::amdgcn_image_sample_d_1darray,
false);
1354 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_lz_2darray_v4f32_f32:
1355 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_lz_2darray_v4f16_f32:
1356 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_lz_2darray_f32_f32:
1358 *
this, E, Intrinsic::amdgcn_image_sample_lz_2darray,
false);
1359 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_l_2darray_v4f32_f32:
1360 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_l_2darray_v4f16_f32:
1361 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_l_2darray_f32_f32:
1363 *
this, E, Intrinsic::amdgcn_image_sample_l_2darray,
false);
1364 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_d_2darray_v4f32_f32:
1365 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_d_2darray_v4f16_f32:
1366 case clang::AMDGPU::BI__builtin_amdgcn_image_sample_d_2darray_f32_f32:
1368 *
this, E, Intrinsic::amdgcn_image_sample_d_2darray,
false);
1369 case clang::AMDGPU::BI__builtin_amdgcn_image_gather4_lz_2d_v4f32_f32:
1371 *
this, E, Intrinsic::amdgcn_image_gather4_lz_2d,
false);
1372 case AMDGPU::BI__builtin_amdgcn_mfma_scale_f32_16x16x128_f8f6f4:
1373 case AMDGPU::BI__builtin_amdgcn_mfma_scale_f32_32x32x64_f8f6f4: {
1374 llvm::FixedVectorType *VT = FixedVectorType::get(
Builder.getInt32Ty(), 8);
1376 BuiltinID == AMDGPU::BI__builtin_amdgcn_mfma_scale_f32_32x32x64_f8f6f4
1377 ? Intrinsic::amdgcn_mfma_scale_f32_32x32x64_f8f6f4
1378 : Intrinsic::amdgcn_mfma_scale_f32_16x16x128_f8f6f4,
1382 for (
unsigned I = 0, N = E->
getNumArgs(); I != N; ++I)
1384 return Builder.CreateCall(F, Args);
1386 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_w32:
1387 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_tied_w32:
1388 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_w64:
1389 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_tied_w64:
1390 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_w32:
1391 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_tied_w32:
1392 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_w64:
1393 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_tied_w64:
1394 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf16_w32:
1395 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf16_w64:
1396 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_f16_w32:
1397 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_f16_w64:
1398 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu4_w32:
1399 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu4_w64:
1400 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu8_w32:
1401 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu8_w64:
1402 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_w32_gfx12:
1403 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_w64_gfx12:
1404 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_w32_gfx12:
1405 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_w64_gfx12:
1406 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf16_w32_gfx12:
1407 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf16_w64_gfx12:
1408 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_f16_w32_gfx12:
1409 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_f16_w64_gfx12:
1410 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu4_w32_gfx12:
1411 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu4_w64_gfx12:
1412 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu8_w32_gfx12:
1413 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu8_w64_gfx12:
1414 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_fp8_fp8_w32_gfx12:
1415 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_fp8_fp8_w64_gfx12:
1416 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_fp8_bf8_w32_gfx12:
1417 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_fp8_bf8_w64_gfx12:
1418 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf8_fp8_w32_gfx12:
1419 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf8_fp8_w64_gfx12:
1420 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf8_bf8_w32_gfx12:
1421 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf8_bf8_w64_gfx12:
1422 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x32_iu4_w32_gfx12:
1423 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x32_iu4_w64_gfx12:
1424 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_f16_w32:
1425 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_f16_w64:
1426 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_bf16_w32:
1427 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_bf16_w64:
1428 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x32_f16_w32:
1429 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x32_f16_w64:
1430 case AMDGPU::BI__builtin_amdgcn_swmmac_bf16_16x16x32_bf16_w32:
1431 case AMDGPU::BI__builtin_amdgcn_swmmac_bf16_16x16x32_bf16_w64:
1432 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x32_iu8_w32:
1433 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x32_iu8_w64:
1434 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x32_iu4_w32:
1435 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x32_iu4_w64:
1436 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x64_iu4_w32:
1437 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x64_iu4_w64:
1438 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_fp8_fp8_w32:
1439 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_fp8_fp8_w64:
1440 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_fp8_bf8_w32:
1441 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_fp8_bf8_w64:
1442 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_bf8_fp8_w32:
1443 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_bf8_fp8_w64:
1444 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_bf8_bf8_w32:
1445 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_bf8_bf8_w64:
1447 case AMDGPU::BI__builtin_amdgcn_wmma_f64_16x16x4_f64:
1448 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x4_f32:
1449 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x32_bf16:
1450 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x32_f16:
1451 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x32_f16:
1452 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x32_bf16:
1453 case AMDGPU::BI__builtin_amdgcn_wmma_bf16f32_16x16x32_bf16:
1454 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x64_fp8_fp8:
1455 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x64_fp8_bf8:
1456 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x64_bf8_fp8:
1457 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x64_bf8_bf8:
1458 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x64_fp8_fp8:
1459 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x64_fp8_bf8:
1460 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x64_bf8_fp8:
1461 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x64_bf8_bf8:
1462 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x128_fp8_fp8:
1463 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x128_fp8_bf8:
1464 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x128_bf8_fp8:
1465 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x128_bf8_bf8:
1466 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x128_fp8_fp8:
1467 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x128_fp8_bf8:
1468 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x128_bf8_fp8:
1469 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x128_bf8_bf8:
1470 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x64_iu8:
1471 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x128_f8f6f4:
1472 case AMDGPU::BI__builtin_amdgcn_wmma_f32_32x16x128_f4:
1473 case AMDGPU::BI__builtin_amdgcn_wmma_scale_f32_16x16x128_f8f6f4:
1474 case AMDGPU::BI__builtin_amdgcn_wmma_scale16_f32_16x16x128_f8f6f4:
1475 case AMDGPU::BI__builtin_amdgcn_wmma_scale_f32_32x16x128_f4:
1476 case AMDGPU::BI__builtin_amdgcn_wmma_scale16_f32_32x16x128_f4:
1477 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x64_f16:
1478 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x64_bf16:
1479 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x64_f16:
1480 case AMDGPU::BI__builtin_amdgcn_swmmac_bf16_16x16x64_bf16:
1481 case AMDGPU::BI__builtin_amdgcn_swmmac_bf16f32_16x16x64_bf16:
1482 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x128_fp8_fp8:
1483 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x128_fp8_bf8:
1484 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x128_bf8_fp8:
1485 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x128_bf8_bf8:
1486 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x128_fp8_fp8:
1487 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x128_fp8_bf8:
1488 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x128_bf8_fp8:
1489 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x128_bf8_bf8:
1490 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x128_iu8: {
1503 bool AppendFalseForOpselArg =
false;
1504 unsigned BuiltinWMMAOp;
1506 bool NeedReturnType =
false;
1508 bool RemoveABNeg =
false;
1510 switch (BuiltinID) {
1511 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_f16_w32:
1512 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_f16_w64:
1513 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_f16_w32_gfx12:
1514 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_f16_w64_gfx12:
1515 ArgsForMatchingMatrixTypes = {2, 0};
1516 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_16x16x16_f16;
1518 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf16_w32:
1519 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf16_w64:
1520 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf16_w32_gfx12:
1521 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf16_w64_gfx12:
1522 ArgsForMatchingMatrixTypes = {2, 0};
1523 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_16x16x16_bf16;
1525 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_w32_gfx12:
1526 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_w64_gfx12:
1527 AppendFalseForOpselArg =
true;
1529 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_w32:
1530 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_w64:
1531 ArgsForMatchingMatrixTypes = {2, 0};
1532 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f16_16x16x16_f16;
1534 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_w32_gfx12:
1535 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_w64_gfx12:
1536 AppendFalseForOpselArg =
true;
1538 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_w32:
1539 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_w64:
1540 ArgsForMatchingMatrixTypes = {2, 0};
1541 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_bf16_16x16x16_bf16;
1543 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_tied_w32:
1544 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x16_f16_tied_w64:
1545 ArgsForMatchingMatrixTypes = {2, 0};
1546 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f16_16x16x16_f16_tied;
1548 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_tied_w32:
1549 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x16_bf16_tied_w64:
1550 ArgsForMatchingMatrixTypes = {2, 0};
1551 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_bf16_16x16x16_bf16_tied;
1553 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu8_w32:
1554 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu8_w64:
1555 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu8_w32_gfx12:
1556 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu8_w64_gfx12:
1557 ArgsForMatchingMatrixTypes = {4, 1};
1558 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_i32_16x16x16_iu8;
1560 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu4_w32:
1561 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu4_w64:
1562 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu4_w32_gfx12:
1563 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x16_iu4_w64_gfx12:
1564 ArgsForMatchingMatrixTypes = {4, 1};
1565 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_i32_16x16x16_iu4;
1567 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_fp8_fp8_w32_gfx12:
1568 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_fp8_fp8_w64_gfx12:
1569 ArgsForMatchingMatrixTypes = {2, 0};
1570 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_16x16x16_fp8_fp8;
1572 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_fp8_bf8_w32_gfx12:
1573 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_fp8_bf8_w64_gfx12:
1574 ArgsForMatchingMatrixTypes = {2, 0};
1575 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_16x16x16_fp8_bf8;
1577 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf8_fp8_w32_gfx12:
1578 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf8_fp8_w64_gfx12:
1579 ArgsForMatchingMatrixTypes = {2, 0};
1580 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_16x16x16_bf8_fp8;
1582 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf8_bf8_w32_gfx12:
1583 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x16_bf8_bf8_w64_gfx12:
1584 ArgsForMatchingMatrixTypes = {2, 0};
1585 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_16x16x16_bf8_bf8;
1587 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x32_iu4_w32_gfx12:
1588 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x32_iu4_w64_gfx12:
1589 ArgsForMatchingMatrixTypes = {4, 1};
1590 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_i32_16x16x32_iu4;
1592 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_f16_w32:
1593 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_f16_w64:
1594 ArgsForMatchingMatrixTypes = {2, 0, 1, 3};
1595 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_f32_16x16x32_f16;
1597 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_bf16_w32:
1598 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_bf16_w64:
1599 ArgsForMatchingMatrixTypes = {2, 0, 1, 3};
1600 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_f32_16x16x32_bf16;
1602 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x32_f16_w32:
1603 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x32_f16_w64:
1604 ArgsForMatchingMatrixTypes = {2, 0, 1, 3};
1605 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_f16_16x16x32_f16;
1607 case AMDGPU::BI__builtin_amdgcn_swmmac_bf16_16x16x32_bf16_w32:
1608 case AMDGPU::BI__builtin_amdgcn_swmmac_bf16_16x16x32_bf16_w64:
1609 ArgsForMatchingMatrixTypes = {2, 0, 1, 3};
1610 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_bf16_16x16x32_bf16;
1612 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x32_iu8_w32:
1613 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x32_iu8_w64:
1614 ArgsForMatchingMatrixTypes = {4, 1, 3, 5};
1615 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_i32_16x16x32_iu8;
1617 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x32_iu4_w32:
1618 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x32_iu4_w64:
1619 ArgsForMatchingMatrixTypes = {4, 1, 3, 5};
1620 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_i32_16x16x32_iu4;
1622 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x64_iu4_w32:
1623 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x64_iu4_w64:
1624 ArgsForMatchingMatrixTypes = {4, 1, 3, 5};
1625 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_i32_16x16x64_iu4;
1627 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_fp8_fp8_w32:
1628 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_fp8_fp8_w64:
1629 ArgsForMatchingMatrixTypes = {2, 0, 1, 3};
1630 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_f32_16x16x32_fp8_fp8;
1632 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_fp8_bf8_w32:
1633 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_fp8_bf8_w64:
1634 ArgsForMatchingMatrixTypes = {2, 0, 1, 3};
1635 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_f32_16x16x32_fp8_bf8;
1637 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_bf8_fp8_w32:
1638 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_bf8_fp8_w64:
1639 ArgsForMatchingMatrixTypes = {2, 0, 1, 3};
1640 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_f32_16x16x32_bf8_fp8;
1642 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_bf8_bf8_w32:
1643 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x32_bf8_bf8_w64:
1644 ArgsForMatchingMatrixTypes = {2, 0, 1, 3};
1645 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_f32_16x16x32_bf8_bf8;
1648 case AMDGPU::BI__builtin_amdgcn_wmma_f64_16x16x4_f64:
1649 ArgsForMatchingMatrixTypes = {5, 1};
1650 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f64_16x16x4_f64;
1652 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x4_f32:
1653 ArgsForMatchingMatrixTypes = {3, 0};
1654 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_16x16x4_f32;
1657 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x32_bf16:
1658 ArgsForMatchingMatrixTypes = {3, 0};
1659 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_16x16x32_bf16;
1662 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x32_f16:
1663 ArgsForMatchingMatrixTypes = {3, 0};
1664 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_16x16x32_f16;
1667 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x32_f16:
1668 ArgsForMatchingMatrixTypes = {3, 0};
1669 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f16_16x16x32_f16;
1672 case AMDGPU::BI__builtin_amdgcn_wmma_bf16_16x16x32_bf16:
1673 ArgsForMatchingMatrixTypes = {3, 0};
1674 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_bf16_16x16x32_bf16;
1677 case AMDGPU::BI__builtin_amdgcn_wmma_bf16f32_16x16x32_bf16:
1678 NeedReturnType =
true;
1679 ArgsForMatchingMatrixTypes = {0, 3};
1680 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_bf16f32_16x16x32_bf16;
1683 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x64_fp8_fp8:
1684 ArgsForMatchingMatrixTypes = {3, 0};
1685 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_16x16x64_fp8_fp8;
1687 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x64_fp8_bf8:
1688 ArgsForMatchingMatrixTypes = {3, 0};
1689 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_16x16x64_fp8_bf8;
1691 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x64_bf8_fp8:
1692 ArgsForMatchingMatrixTypes = {3, 0};
1693 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_16x16x64_bf8_fp8;
1695 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x64_bf8_bf8:
1696 ArgsForMatchingMatrixTypes = {3, 0};
1697 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_16x16x64_bf8_bf8;
1699 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x64_fp8_fp8:
1700 ArgsForMatchingMatrixTypes = {3, 0};
1701 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f16_16x16x64_fp8_fp8;
1703 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x64_fp8_bf8:
1704 ArgsForMatchingMatrixTypes = {3, 0};
1705 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f16_16x16x64_fp8_bf8;
1707 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x64_bf8_fp8:
1708 ArgsForMatchingMatrixTypes = {3, 0};
1709 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f16_16x16x64_bf8_fp8;
1711 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x64_bf8_bf8:
1712 ArgsForMatchingMatrixTypes = {3, 0};
1713 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f16_16x16x64_bf8_bf8;
1715 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x128_fp8_fp8:
1716 ArgsForMatchingMatrixTypes = {3, 0};
1717 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f16_16x16x128_fp8_fp8;
1719 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x128_fp8_bf8:
1720 ArgsForMatchingMatrixTypes = {3, 0};
1721 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f16_16x16x128_fp8_bf8;
1723 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x128_bf8_fp8:
1724 ArgsForMatchingMatrixTypes = {3, 0};
1725 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f16_16x16x128_bf8_fp8;
1727 case AMDGPU::BI__builtin_amdgcn_wmma_f16_16x16x128_bf8_bf8:
1728 ArgsForMatchingMatrixTypes = {3, 0};
1729 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f16_16x16x128_bf8_bf8;
1731 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x128_fp8_fp8:
1732 ArgsForMatchingMatrixTypes = {3, 0};
1733 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_16x16x128_fp8_fp8;
1735 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x128_fp8_bf8:
1736 ArgsForMatchingMatrixTypes = {3, 0};
1737 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_16x16x128_fp8_bf8;
1739 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x128_bf8_fp8:
1740 ArgsForMatchingMatrixTypes = {3, 0};
1741 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_16x16x128_bf8_fp8;
1743 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x128_bf8_bf8:
1744 ArgsForMatchingMatrixTypes = {3, 0};
1745 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_16x16x128_bf8_bf8;
1747 case AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x64_iu8:
1748 ArgsForMatchingMatrixTypes = {4, 1};
1749 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_i32_16x16x64_iu8;
1751 case AMDGPU::BI__builtin_amdgcn_wmma_f32_16x16x128_f8f6f4:
1752 ArgsForMatchingMatrixTypes = {5, 1, 3};
1753 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_16x16x128_f8f6f4;
1755 case AMDGPU::BI__builtin_amdgcn_wmma_scale_f32_16x16x128_f8f6f4:
1756 ArgsForMatchingMatrixTypes = {5, 1, 3};
1757 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_scale_f32_16x16x128_f8f6f4;
1759 case AMDGPU::BI__builtin_amdgcn_wmma_scale16_f32_16x16x128_f8f6f4:
1760 ArgsForMatchingMatrixTypes = {5, 1, 3};
1761 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_scale16_f32_16x16x128_f8f6f4;
1763 case AMDGPU::BI__builtin_amdgcn_wmma_f32_32x16x128_f4:
1764 ArgsForMatchingMatrixTypes = {3, 0, 1};
1765 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_f32_32x16x128_f4;
1767 case AMDGPU::BI__builtin_amdgcn_wmma_scale_f32_32x16x128_f4:
1768 ArgsForMatchingMatrixTypes = {3, 0, 1};
1769 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_scale_f32_32x16x128_f4;
1771 case AMDGPU::BI__builtin_amdgcn_wmma_scale16_f32_32x16x128_f4:
1772 ArgsForMatchingMatrixTypes = {3, 0, 1};
1773 BuiltinWMMAOp = Intrinsic::amdgcn_wmma_scale16_f32_32x16x128_f4;
1775 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x64_f16:
1776 ArgsForMatchingMatrixTypes = {4, 1, 3, 5};
1777 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_f32_16x16x64_f16;
1779 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x64_bf16:
1780 ArgsForMatchingMatrixTypes = {4, 1, 3, 5};
1781 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_f32_16x16x64_bf16;
1783 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x64_f16:
1784 ArgsForMatchingMatrixTypes = {4, 1, 3, 5};
1785 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_f16_16x16x64_f16;
1787 case AMDGPU::BI__builtin_amdgcn_swmmac_bf16_16x16x64_bf16:
1788 ArgsForMatchingMatrixTypes = {4, 1, 3, 5};
1789 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_bf16_16x16x64_bf16;
1791 case AMDGPU::BI__builtin_amdgcn_swmmac_bf16f32_16x16x64_bf16:
1792 ArgsForMatchingMatrixTypes = {4, 1, 3, 5};
1793 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_bf16f32_16x16x64_bf16;
1795 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x128_fp8_fp8:
1796 ArgsForMatchingMatrixTypes = {2, 0, 1, 3};
1797 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_f32_16x16x128_fp8_fp8;
1799 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x128_fp8_bf8:
1800 ArgsForMatchingMatrixTypes = {2, 0, 1, 3};
1801 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_f32_16x16x128_fp8_bf8;
1803 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x128_bf8_fp8:
1804 ArgsForMatchingMatrixTypes = {2, 0, 1, 3};
1805 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_f32_16x16x128_bf8_fp8;
1807 case AMDGPU::BI__builtin_amdgcn_swmmac_f32_16x16x128_bf8_bf8:
1808 ArgsForMatchingMatrixTypes = {2, 0, 1, 3};
1809 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_f32_16x16x128_bf8_bf8;
1811 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x128_fp8_fp8:
1812 ArgsForMatchingMatrixTypes = {2, 0, 1, 3};
1813 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_f16_16x16x128_fp8_fp8;
1815 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x128_fp8_bf8:
1816 ArgsForMatchingMatrixTypes = {2, 0, 1, 3};
1817 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_f16_16x16x128_fp8_bf8;
1819 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x128_bf8_fp8:
1820 ArgsForMatchingMatrixTypes = {2, 0, 1, 3};
1821 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_f16_16x16x128_bf8_fp8;
1823 case AMDGPU::BI__builtin_amdgcn_swmmac_f16_16x16x128_bf8_bf8:
1824 ArgsForMatchingMatrixTypes = {2, 0, 1, 3};
1825 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_f16_16x16x128_bf8_bf8;
1827 case AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x128_iu8:
1828 ArgsForMatchingMatrixTypes = {4, 1, 3, 5};
1829 BuiltinWMMAOp = Intrinsic::amdgcn_swmmac_i32_16x16x128_iu8;
1834 for (
int i = 0, e = E->
getNumArgs(); i != e; ++i) {
1836 if (RemoveABNeg && (i == 0 || i == 2))
1840 if (AppendFalseForOpselArg)
1841 Args.push_back(
Builder.getFalse());
1844 if (BuiltinID == AMDGPU::BI__builtin_amdgcn_wmma_i32_16x16x64_iu8) {
1845 if (Args.size() == 7)
1846 Args.push_back(
Builder.getFalse());
1847 assert(Args.size() == 8 &&
"Expected 8 arguments");
1848 Args[7] =
Builder.CreateZExtOrTrunc(Args[7],
Builder.getInt1Ty());
1849 }
else if (BuiltinID ==
1850 AMDGPU::BI__builtin_amdgcn_swmmac_i32_16x16x128_iu8) {
1851 if (Args.size() == 8)
1852 Args.push_back(
Builder.getFalse());
1853 assert(Args.size() == 9 &&
"Expected 9 arguments");
1854 Args[8] =
Builder.CreateZExtOrTrunc(Args[8],
Builder.getInt1Ty());
1860 for (
auto ArgIdx : ArgsForMatchingMatrixTypes)
1861 ArgTypes.push_back(Args[ArgIdx]->
getType());
1863 Function *F =
CGM.getIntrinsic(BuiltinWMMAOp, ArgTypes);
1864 return Builder.CreateCall(F, Args);
1867 case AMDGPU::BI__builtin_amdgcn_workgroup_size_x:
1868 return EmitAMDGPUWorkGroupSize(*
this, 0);
1869 case AMDGPU::BI__builtin_amdgcn_workgroup_size_y:
1870 return EmitAMDGPUWorkGroupSize(*
this, 1);
1871 case AMDGPU::BI__builtin_amdgcn_workgroup_size_z:
1872 return EmitAMDGPUWorkGroupSize(*
this, 2);
1875 case AMDGPU::BI__builtin_amdgcn_grid_size_x:
1876 return EmitAMDGPUGridSize(*
this, 0);
1877 case AMDGPU::BI__builtin_amdgcn_grid_size_y:
1878 return EmitAMDGPUGridSize(*
this, 1);
1879 case AMDGPU::BI__builtin_amdgcn_grid_size_z:
1880 return EmitAMDGPUGridSize(*
this, 2);
1883 case AMDGPU::BI__builtin_r600_recipsqrt_ieee:
1884 case AMDGPU::BI__builtin_r600_recipsqrt_ieeef:
1886 Intrinsic::r600_recipsqrt_ieee);
1887 case AMDGPU::BI__builtin_amdgcn_alignbit: {
1891 Function *F =
CGM.getIntrinsic(Intrinsic::fshr, Src0->getType());
1892 return Builder.CreateCall(F, { Src0, Src1, Src2 });
1894 case AMDGPU::BI__builtin_amdgcn_fence: {
1897 FenceInst *Fence =
Builder.CreateFence(AO, SSID);
1902 case AMDGPU::BI__builtin_amdgcn_atomic_inc32:
1903 case AMDGPU::BI__builtin_amdgcn_atomic_inc64:
1904 case AMDGPU::BI__builtin_amdgcn_atomic_dec32:
1905 case AMDGPU::BI__builtin_amdgcn_atomic_dec64:
1906 case AMDGPU::BI__builtin_amdgcn_ds_atomic_fadd_f64:
1907 case AMDGPU::BI__builtin_amdgcn_ds_atomic_fadd_f32:
1908 case AMDGPU::BI__builtin_amdgcn_ds_atomic_fadd_v2f16:
1909 case AMDGPU::BI__builtin_amdgcn_ds_atomic_fadd_v2bf16:
1910 case AMDGPU::BI__builtin_amdgcn_ds_faddf:
1911 case AMDGPU::BI__builtin_amdgcn_ds_fminf:
1912 case AMDGPU::BI__builtin_amdgcn_ds_fmaxf:
1913 case AMDGPU::BI__builtin_amdgcn_global_atomic_fadd_f32:
1914 case AMDGPU::BI__builtin_amdgcn_global_atomic_fadd_f64:
1915 case AMDGPU::BI__builtin_amdgcn_global_atomic_fadd_v2f16:
1916 case AMDGPU::BI__builtin_amdgcn_flat_atomic_fadd_v2f16:
1917 case AMDGPU::BI__builtin_amdgcn_flat_atomic_fadd_f32:
1918 case AMDGPU::BI__builtin_amdgcn_flat_atomic_fadd_f64:
1919 case AMDGPU::BI__builtin_amdgcn_global_atomic_fadd_v2bf16:
1920 case AMDGPU::BI__builtin_amdgcn_flat_atomic_fadd_v2bf16:
1921 case AMDGPU::BI__builtin_amdgcn_global_atomic_fmin_f64:
1922 case AMDGPU::BI__builtin_amdgcn_global_atomic_fmax_f64:
1923 case AMDGPU::BI__builtin_amdgcn_flat_atomic_fmin_f64:
1924 case AMDGPU::BI__builtin_amdgcn_flat_atomic_fmax_f64: {
1925 llvm::AtomicRMWInst::BinOp BinOp;
1926 switch (BuiltinID) {
1927 case AMDGPU::BI__builtin_amdgcn_atomic_inc32:
1928 case AMDGPU::BI__builtin_amdgcn_atomic_inc64:
1929 BinOp = llvm::AtomicRMWInst::UIncWrap;
1931 case AMDGPU::BI__builtin_amdgcn_atomic_dec32:
1932 case AMDGPU::BI__builtin_amdgcn_atomic_dec64:
1933 BinOp = llvm::AtomicRMWInst::UDecWrap;
1935 case AMDGPU::BI__builtin_amdgcn_ds_faddf:
1936 case AMDGPU::BI__builtin_amdgcn_ds_atomic_fadd_f64:
1937 case AMDGPU::BI__builtin_amdgcn_ds_atomic_fadd_f32:
1938 case AMDGPU::BI__builtin_amdgcn_ds_atomic_fadd_v2f16:
1939 case AMDGPU::BI__builtin_amdgcn_ds_atomic_fadd_v2bf16:
1940 case AMDGPU::BI__builtin_amdgcn_global_atomic_fadd_f32:
1941 case AMDGPU::BI__builtin_amdgcn_global_atomic_fadd_f64:
1942 case AMDGPU::BI__builtin_amdgcn_global_atomic_fadd_v2f16:
1943 case AMDGPU::BI__builtin_amdgcn_flat_atomic_fadd_v2f16:
1944 case AMDGPU::BI__builtin_amdgcn_flat_atomic_fadd_f32:
1945 case AMDGPU::BI__builtin_amdgcn_flat_atomic_fadd_f64:
1946 case AMDGPU::BI__builtin_amdgcn_global_atomic_fadd_v2bf16:
1947 case AMDGPU::BI__builtin_amdgcn_flat_atomic_fadd_v2bf16:
1948 BinOp = llvm::AtomicRMWInst::FAdd;
1950 case AMDGPU::BI__builtin_amdgcn_ds_fminf:
1951 case AMDGPU::BI__builtin_amdgcn_global_atomic_fmin_f64:
1952 case AMDGPU::BI__builtin_amdgcn_flat_atomic_fmin_f64:
1953 BinOp = llvm::AtomicRMWInst::FMin;
1955 case AMDGPU::BI__builtin_amdgcn_global_atomic_fmax_f64:
1956 case AMDGPU::BI__builtin_amdgcn_flat_atomic_fmax_f64:
1957 case AMDGPU::BI__builtin_amdgcn_ds_fmaxf:
1958 BinOp = llvm::AtomicRMWInst::FMax;
1964 llvm::Type *OrigTy = Val->
getType();
1969 if (BuiltinID == AMDGPU::BI__builtin_amdgcn_ds_faddf ||
1970 BuiltinID == AMDGPU::BI__builtin_amdgcn_ds_fminf ||
1971 BuiltinID == AMDGPU::BI__builtin_amdgcn_ds_fmaxf) {
1996 AO = AtomicOrdering::Monotonic;
1999 if (BuiltinID == AMDGPU::BI__builtin_amdgcn_ds_atomic_fadd_v2bf16 ||
2000 BuiltinID == AMDGPU::BI__builtin_amdgcn_global_atomic_fadd_v2bf16 ||
2001 BuiltinID == AMDGPU::BI__builtin_amdgcn_flat_atomic_fadd_v2bf16) {
2002 llvm::Type *V2BF16Ty = FixedVectorType::get(
2003 llvm::Type::getBFloatTy(
Builder.getContext()), 2);
2004 Val =
Builder.CreateBitCast(Val, V2BF16Ty);
2008 llvm::AtomicRMWInst *RMW =
2009 Builder.CreateAtomicRMW(BinOp, Ptr, Val, AO, SSID);
2011 RMW->setVolatile(
true);
2013 unsigned AddrSpace = Ptr.
getType()->getAddressSpace();
2014 if (AddrSpace != llvm::AMDGPUAS::LOCAL_ADDRESS) {
2018 RMW->setMetadata(
"amdgpu.no.fine.grained.memory", EmptyMD);
2022 if (BinOp == llvm::AtomicRMWInst::FAdd && Val->
getType()->isFloatTy())
2023 RMW->setMetadata(
"amdgpu.ignore.denormal.mode", EmptyMD);
2026 return Builder.CreateBitCast(RMW, OrigTy);
2028 case AMDGPU::BI__builtin_amdgcn_s_sendmsg_rtn:
2029 case AMDGPU::BI__builtin_amdgcn_s_sendmsg_rtnl: {
2034 CGM.getIntrinsic(Intrinsic::amdgcn_s_sendmsg_rtn, {ResultType});
2035 return Builder.CreateCall(F, {Arg});
2037 case AMDGPU::BI__builtin_amdgcn_permlane16_swap:
2038 case AMDGPU::BI__builtin_amdgcn_permlane32_swap: {
2046 CGM.getIntrinsic(BuiltinID == AMDGPU::BI__builtin_amdgcn_permlane16_swap
2047 ? Intrinsic::amdgcn_permlane16_swap
2048 : Intrinsic::amdgcn_permlane32_swap);
2049 llvm::CallInst *
Call =
2050 Builder.CreateCall(F, {VDstOld, VSrcOld, FI, BoundCtrl});
2052 llvm::Value *Elt0 =
Builder.CreateExtractValue(
Call, 0);
2053 llvm::Value *Elt1 =
Builder.CreateExtractValue(
Call, 1);
2057 llvm::Value *Insert0 =
Builder.CreateInsertElement(
2058 llvm::PoisonValue::get(ResultType), Elt0, UINT64_C(0));
2059 llvm::Value *AsVector =
2060 Builder.CreateInsertElement(Insert0, Elt1, UINT64_C(1));
2063 case AMDGPU::BI__builtin_amdgcn_bitop3_b32:
2064 case AMDGPU::BI__builtin_amdgcn_bitop3_b16:
2066 Intrinsic::amdgcn_bitop3);
2067 case AMDGPU::BI__builtin_amdgcn_make_buffer_rsrc: {
2072 for (
unsigned I = 0; I < 4; ++I)
2074 llvm::PointerType *RetTy = llvm::PointerType::get(
2075 Builder.getContext(), llvm::AMDGPUAS::BUFFER_RESOURCE);
2076 Function *F =
CGM.getIntrinsic(Intrinsic::amdgcn_make_buffer_rsrc,
2077 {RetTy, Args[0]->getType()});
2078 return Builder.CreateCall(F, Args);
2080 case AMDGPU::BI__builtin_amdgcn_raw_buffer_store_b8:
2081 case AMDGPU::BI__builtin_amdgcn_raw_buffer_store_b16:
2082 case AMDGPU::BI__builtin_amdgcn_raw_buffer_store_b32:
2083 case AMDGPU::BI__builtin_amdgcn_raw_buffer_store_b64:
2084 case AMDGPU::BI__builtin_amdgcn_raw_buffer_store_b96:
2085 case AMDGPU::BI__builtin_amdgcn_raw_buffer_store_b128:
2087 *
this, E, Intrinsic::amdgcn_raw_ptr_buffer_store);
2088 case AMDGPU::BI__builtin_amdgcn_raw_buffer_store_format_v4f32:
2089 case AMDGPU::BI__builtin_amdgcn_raw_buffer_store_format_v4f16:
2091 *
this, E, Intrinsic::amdgcn_raw_ptr_buffer_store_format);
2092 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_b8:
2093 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_b16:
2094 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_b32:
2095 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_b64:
2096 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_b96:
2097 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_b128: {
2098 llvm::Type *RetTy =
nullptr;
2099 switch (BuiltinID) {
2100 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_b8:
2103 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_b16:
2106 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_b32:
2109 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_b64:
2110 RetTy = llvm::FixedVectorType::get(
Int32Ty, 2);
2112 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_b96:
2113 RetTy = llvm::FixedVectorType::get(
Int32Ty, 3);
2115 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_b128:
2116 RetTy = llvm::FixedVectorType::get(
Int32Ty, 4);
2120 CGM.getIntrinsic(Intrinsic::amdgcn_raw_ptr_buffer_load, RetTy);
2125 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_format_v4f32:
2126 case AMDGPU::BI__builtin_amdgcn_raw_buffer_load_format_v4f16: {
2129 CGM.getIntrinsic(Intrinsic::amdgcn_raw_ptr_buffer_load_format, {RetTy});
2135 case AMDGPU::BI__builtin_amdgcn_struct_buffer_store_format_v4f32:
2136 case AMDGPU::BI__builtin_amdgcn_struct_buffer_store_format_v4f16:
2138 *
this, E, Intrinsic::amdgcn_struct_ptr_buffer_store_format);
2139 case AMDGPU::BI__builtin_amdgcn_struct_buffer_load_format_v4f32:
2140 case AMDGPU::BI__builtin_amdgcn_struct_buffer_load_format_v4f16: {
2143 Intrinsic::amdgcn_struct_ptr_buffer_load_format, {RetTy});
2150 case AMDGPU::BI__builtin_amdgcn_raw_ptr_buffer_atomic_add_i32:
2152 *
this, E, Intrinsic::amdgcn_raw_ptr_buffer_atomic_add);
2153 case AMDGPU::BI__builtin_amdgcn_raw_ptr_buffer_atomic_fadd_f32:
2154 case AMDGPU::BI__builtin_amdgcn_raw_ptr_buffer_atomic_fadd_v2f16:
2156 *
this, E, Intrinsic::amdgcn_raw_ptr_buffer_atomic_fadd);
2157 case AMDGPU::BI__builtin_amdgcn_raw_ptr_buffer_atomic_fmin_f32:
2158 case AMDGPU::BI__builtin_amdgcn_raw_ptr_buffer_atomic_fmin_f64:
2160 *
this, E, Intrinsic::amdgcn_raw_ptr_buffer_atomic_fmin);
2161 case AMDGPU::BI__builtin_amdgcn_raw_ptr_buffer_atomic_fmax_f32:
2162 case AMDGPU::BI__builtin_amdgcn_raw_ptr_buffer_atomic_fmax_f64:
2164 *
this, E, Intrinsic::amdgcn_raw_ptr_buffer_atomic_fmax);
2165 case AMDGPU::BI__builtin_amdgcn_s_prefetch_data:
2167 *
this, E, Intrinsic::amdgcn_s_prefetch_data);
2168 case Builtin::BIlogbf:
2169 case Builtin::BI__builtin_logbf: {
2173 CallInst *FrExp =
Builder.CreateCall(FrExpFunc, Src0);
2176 Exp, ConstantInt::getSigned(Exp->
getType(), -1),
"",
false,
true);
2181 Fabs, ConstantFP::getInfinity(
Builder.getFloatTy()));
2182 Value *Sel1 =
Builder.CreateSelect(FCmpONE, SIToFP, Fabs);
2184 Builder.CreateFCmpOEQ(Src0, ConstantFP::getZero(
Builder.getFloatTy()));
2187 ConstantFP::getInfinity(
Builder.getFloatTy(),
true), Sel1);
2190 case Builtin::BIlogb:
2191 case Builtin::BI__builtin_logb: {
2195 CallInst *FrExp =
Builder.CreateCall(FrExpFunc, Src0);
2198 Exp, ConstantInt::getSigned(Exp->
getType(), -1),
"",
false,
true);
2203 Fabs, ConstantFP::getInfinity(
Builder.getDoubleTy()));
2204 Value *Sel1 =
Builder.CreateSelect(FCmpONE, SIToFP, Fabs);
2206 Builder.CreateFCmpOEQ(Src0, ConstantFP::getZero(
Builder.getDoubleTy()));
2209 ConstantFP::getInfinity(
Builder.getDoubleTy(),
true),
2213 case Builtin::BIscalbnf:
2214 case Builtin::BI__builtin_scalbnf:
2215 case Builtin::BIscalbn:
2216 case Builtin::BI__builtin_scalbn:
2218 *
this, E, Intrinsic::ldexp, Intrinsic::experimental_constrained_ldexp);
2219 case AMDGPU::BI__builtin_amdgcn_permlane_bcast:
2221 *
this, E, Intrinsic::amdgcn_permlane_bcast);
2222 case AMDGPU::BI__builtin_amdgcn_permlane_up:
2224 Intrinsic::amdgcn_permlane_up);
2225 case AMDGPU::BI__builtin_amdgcn_permlane_down:
2227 Intrinsic::amdgcn_permlane_down);
2228 case AMDGPU::BI__builtin_amdgcn_permlane_xor:
2230 Intrinsic::amdgcn_permlane_xor);