626 unsigned altLLVMIntrinsic,
const char *nameHint,
unsigned modifier,
628 mlir::Location loc = cgf.
getLoc(
expr->getExprLoc());
635 std::optional<llvm::APSInt> neonTypeConst = arg->getIntegerConstantExpr(ctx);
652 cir::VectorType vTy =
getNeonType(&cgf, neonType, loc, hasLegalHalfType,
653 false, allowBFloatArgsAndRet);
654 cir::VectorType ty = vTy;
659 case NEON::BI__builtin_neon_splat_lane_v:
660 case NEON::BI__builtin_neon_splat_laneq_v:
661 case NEON::BI__builtin_neon_splatq_lane_v:
662 case NEON::BI__builtin_neon_splatq_laneq_v: {
663 uint64_t numElements = vTy.getSize();
664 if (builtinID == NEON::BI__builtin_neon_splatq_lane_v)
666 if (builtinID == NEON::BI__builtin_neon_splat_laneq_v)
671 case NEON::BI__builtin_neon_vpadd_v:
672 case NEON::BI__builtin_neon_vpaddq_v:
673 case NEON::BI__builtin_neon_vabs_v:
674 case NEON::BI__builtin_neon_vabsq_v:
676 std::string(
"unimplemented AArch64 builtin call: ") +
678 return mlir::Value{};
679 case NEON::BI__builtin_neon_vadd_v:
680 case NEON::BI__builtin_neon_vaddq_v: {
681 unsigned numBytes = (builtinID == NEON::BI__builtin_neon_vaddq_v) ? 16 : 8;
682 cir::VectorType byteTy =
689 case NEON::BI__builtin_neon_vaddhn_v:
690 case NEON::BI__builtin_neon_vcale_v:
691 case NEON::BI__builtin_neon_vcaleq_v:
692 case NEON::BI__builtin_neon_vcalt_v:
693 case NEON::BI__builtin_neon_vcaltq_v:
694 case NEON::BI__builtin_neon_vcage_v:
695 case NEON::BI__builtin_neon_vcageq_v:
696 case NEON::BI__builtin_neon_vcagt_v:
697 case NEON::BI__builtin_neon_vcagtq_v:
699 std::string(
"unimplemented AArch64 builtin call: ") +
701 return mlir::Value{};
702 case NEON::BI__builtin_neon_vceqz_v:
703 case NEON::BI__builtin_neon_vceqzq_v:
705 vTy, cir::CmpOpKind::eq);
706 case NEON::BI__builtin_neon_vcgez_v:
707 case NEON::BI__builtin_neon_vcgezq_v:
708 case NEON::BI__builtin_neon_vclez_v:
709 case NEON::BI__builtin_neon_vclezq_v:
710 case NEON::BI__builtin_neon_vcgtz_v:
711 case NEON::BI__builtin_neon_vcgtzq_v:
712 case NEON::BI__builtin_neon_vcltz_v:
713 case NEON::BI__builtin_neon_vcltzq_v:
714 case NEON::BI__builtin_neon_vclz_v:
715 case NEON::BI__builtin_neon_vclzq_v:
716 case NEON::BI__builtin_neon_vcvt_f32_v:
717 case NEON::BI__builtin_neon_vcvtq_f32_v:
718 case NEON::BI__builtin_neon_vcvt_f16_s16:
719 case NEON::BI__builtin_neon_vcvt_f16_u16:
720 case NEON::BI__builtin_neon_vcvtq_f16_s16:
721 case NEON::BI__builtin_neon_vcvtq_f16_u16:
722 case NEON::BI__builtin_neon_vcvt_n_f16_s16:
723 case NEON::BI__builtin_neon_vcvt_n_f16_u16:
724 case NEON::BI__builtin_neon_vcvtq_n_f16_s16:
725 case NEON::BI__builtin_neon_vcvtq_n_f16_u16:
727 std::string(
"unimplemented AArch64 builtin call: ") +
729 return mlir::Value{};
730 case NEON::BI__builtin_neon_vcvt_n_f32_v:
731 case NEON::BI__builtin_neon_vcvt_n_f64_v:
732 case NEON::BI__builtin_neon_vcvtq_n_f32_v:
733 case NEON::BI__builtin_neon_vcvtq_n_f64_v: {
736 llvm::StringRef llvmIntrName =
738 usgn ? llvmIntrinsic : altLLVMIntrinsic));
740 {vTy, cstIntTy}, ops, llvmIntrName,
743 case NEON::BI__builtin_neon_vcvt_n_s16_f16:
744 case NEON::BI__builtin_neon_vcvt_n_s32_v:
745 case NEON::BI__builtin_neon_vcvt_n_u16_f16:
746 case NEON::BI__builtin_neon_vcvt_n_u32_v:
747 case NEON::BI__builtin_neon_vcvt_n_s64_v:
748 case NEON::BI__builtin_neon_vcvt_n_u64_v:
749 case NEON::BI__builtin_neon_vcvtq_n_s16_f16:
750 case NEON::BI__builtin_neon_vcvtq_n_s32_v:
751 case NEON::BI__builtin_neon_vcvtq_n_u16_f16:
752 case NEON::BI__builtin_neon_vcvtq_n_u32_v:
753 case NEON::BI__builtin_neon_vcvtq_n_s64_v:
754 case NEON::BI__builtin_neon_vcvtq_n_u64_v: {
758 static_cast<llvm::Intrinsic::ID
>(llvmIntrinsic));
761 {getFloatNeonType(cgf, neonType), cstIntTy}, ops,
765 case NEON::BI__builtin_neon_vcvt_s32_v:
766 case NEON::BI__builtin_neon_vcvt_u32_v:
767 case NEON::BI__builtin_neon_vcvt_s64_v:
768 case NEON::BI__builtin_neon_vcvt_u64_v:
769 case NEON::BI__builtin_neon_vcvt_s16_f16:
770 case NEON::BI__builtin_neon_vcvt_u16_f16:
771 case NEON::BI__builtin_neon_vcvtq_s32_v:
772 case NEON::BI__builtin_neon_vcvtq_u32_v:
773 case NEON::BI__builtin_neon_vcvtq_s64_v:
774 case NEON::BI__builtin_neon_vcvtq_u64_v:
775 case NEON::BI__builtin_neon_vcvtq_s16_f16:
776 case NEON::BI__builtin_neon_vcvtq_u16_f16: {
786 llvm::StringRef llvmIntrName = usgn ?
"fptoui.sat" :
"fptosi.sat";
788 {ty}, ops, llvmIntrName, vTy, loc);
790 case NEON::BI__builtin_neon_vcvta_s16_f16:
791 case NEON::BI__builtin_neon_vcvta_s32_v:
792 case NEON::BI__builtin_neon_vcvta_s64_v:
793 case NEON::BI__builtin_neon_vcvta_u16_f16:
794 case NEON::BI__builtin_neon_vcvta_u32_v:
795 case NEON::BI__builtin_neon_vcvta_u64_v:
796 case NEON::BI__builtin_neon_vcvtaq_s16_f16:
797 case NEON::BI__builtin_neon_vcvtaq_s32_v:
798 case NEON::BI__builtin_neon_vcvtaq_s64_v:
799 case NEON::BI__builtin_neon_vcvtaq_u16_f16:
800 case NEON::BI__builtin_neon_vcvtaq_u32_v:
801 case NEON::BI__builtin_neon_vcvtaq_u64_v:
802 case NEON::BI__builtin_neon_vcvtn_s16_f16:
803 case NEON::BI__builtin_neon_vcvtn_s32_v:
804 case NEON::BI__builtin_neon_vcvtn_s64_v:
805 case NEON::BI__builtin_neon_vcvtn_u16_f16:
806 case NEON::BI__builtin_neon_vcvtn_u32_v:
807 case NEON::BI__builtin_neon_vcvtn_u64_v:
808 case NEON::BI__builtin_neon_vcvtnq_s16_f16:
809 case NEON::BI__builtin_neon_vcvtnq_s32_v:
810 case NEON::BI__builtin_neon_vcvtnq_s64_v:
811 case NEON::BI__builtin_neon_vcvtnq_u16_f16:
812 case NEON::BI__builtin_neon_vcvtnq_u32_v:
813 case NEON::BI__builtin_neon_vcvtnq_u64_v:
814 case NEON::BI__builtin_neon_vcvtp_s16_f16:
815 case NEON::BI__builtin_neon_vcvtp_s32_v:
816 case NEON::BI__builtin_neon_vcvtp_s64_v:
817 case NEON::BI__builtin_neon_vcvtp_u16_f16:
818 case NEON::BI__builtin_neon_vcvtp_u32_v:
819 case NEON::BI__builtin_neon_vcvtp_u64_v:
820 case NEON::BI__builtin_neon_vcvtpq_s16_f16:
821 case NEON::BI__builtin_neon_vcvtpq_s32_v:
822 case NEON::BI__builtin_neon_vcvtpq_s64_v:
823 case NEON::BI__builtin_neon_vcvtpq_u16_f16:
824 case NEON::BI__builtin_neon_vcvtpq_u32_v:
825 case NEON::BI__builtin_neon_vcvtpq_u64_v:
826 case NEON::BI__builtin_neon_vcvtm_s16_f16:
827 case NEON::BI__builtin_neon_vcvtm_s32_v:
828 case NEON::BI__builtin_neon_vcvtm_s64_v:
829 case NEON::BI__builtin_neon_vcvtm_u16_f16:
830 case NEON::BI__builtin_neon_vcvtm_u32_v:
831 case NEON::BI__builtin_neon_vcvtm_u64_v:
832 case NEON::BI__builtin_neon_vcvtmq_s16_f16:
833 case NEON::BI__builtin_neon_vcvtmq_s32_v:
834 case NEON::BI__builtin_neon_vcvtmq_s64_v:
835 case NEON::BI__builtin_neon_vcvtmq_u16_f16:
836 case NEON::BI__builtin_neon_vcvtmq_u32_v:
837 case NEON::BI__builtin_neon_vcvtmq_u64_v:
838 case NEON::BI__builtin_neon_vcvtx_f32_v:
839 case NEON::BI__builtin_neon_vext_v:
840 case NEON::BI__builtin_neon_vextq_v:
841 case NEON::BI__builtin_neon_vfma_v:
843 std::string(
"unimplemented AArch64 builtin call: ") +
845 return mlir::Value{};
846 case NEON::BI__builtin_neon_vfmaq_v: {
857 case NEON::BI__builtin_neon_vld1_v:
858 case NEON::BI__builtin_neon_vld1q_v:
859 case NEON::BI__builtin_neon_vld1_x2_v:
860 case NEON::BI__builtin_neon_vld1q_x2_v:
861 case NEON::BI__builtin_neon_vld1_x3_v:
862 case NEON::BI__builtin_neon_vld1q_x3_v:
863 case NEON::BI__builtin_neon_vld1_x4_v:
864 case NEON::BI__builtin_neon_vld1q_x4_v:
865 case NEON::BI__builtin_neon_vld2_v:
866 case NEON::BI__builtin_neon_vld2q_v:
867 case NEON::BI__builtin_neon_vld3_v:
868 case NEON::BI__builtin_neon_vld3q_v:
869 case NEON::BI__builtin_neon_vld4_v:
870 case NEON::BI__builtin_neon_vld4q_v:
871 case NEON::BI__builtin_neon_vld2_dup_v:
872 case NEON::BI__builtin_neon_vld2q_dup_v:
873 case NEON::BI__builtin_neon_vld3_dup_v:
874 case NEON::BI__builtin_neon_vld3q_dup_v:
875 case NEON::BI__builtin_neon_vld4_dup_v:
876 case NEON::BI__builtin_neon_vld4q_dup_v:
877 case NEON::BI__builtin_neon_vld1_dup_v:
878 case NEON::BI__builtin_neon_vld1q_dup_v:
879 case NEON::BI__builtin_neon_vld2_lane_v:
880 case NEON::BI__builtin_neon_vld2q_lane_v:
881 case NEON::BI__builtin_neon_vld3_lane_v:
882 case NEON::BI__builtin_neon_vld3q_lane_v:
883 case NEON::BI__builtin_neon_vld4_lane_v:
884 case NEON::BI__builtin_neon_vld4q_lane_v:
885 case NEON::BI__builtin_neon_vmovl_v:
886 case NEON::BI__builtin_neon_vmovn_v:
887 case NEON::BI__builtin_neon_vmull_v:
888 case NEON::BI__builtin_neon_vpadal_v:
889 case NEON::BI__builtin_neon_vpadalq_v:
891 std::string(
"Reached code-path for ARM builtin call ") +
893 "(ARM builtins are not supported ATM)");
894 return mlir::Value{};
895 case NEON::BI__builtin_neon_vpaddl_v:
896 case NEON::BI__builtin_neon_vpaddlq_v: {
897 llvm::StringRef llvmIntrName =
899 usgn ? llvmIntrinsic : altLLVMIntrinsic));
901 {getNeonPairwiseWidenInputType(vTy, usgn)},
905 case NEON::BI__builtin_neon_vqdmlal_v:
906 case NEON::BI__builtin_neon_vqdmlsl_v:
907 case NEON::BI__builtin_neon_vqdmulhq_lane_v:
908 case NEON::BI__builtin_neon_vqdmulh_lane_v:
909 case NEON::BI__builtin_neon_vqrdmulhq_lane_v:
910 case NEON::BI__builtin_neon_vqrdmulh_lane_v:
911 case NEON::BI__builtin_neon_vqdmulhq_laneq_v:
912 case NEON::BI__builtin_neon_vqdmulh_laneq_v:
913 case NEON::BI__builtin_neon_vqrdmulhq_laneq_v:
914 case NEON::BI__builtin_neon_vqrdmulh_laneq_v:
915 case NEON::BI__builtin_neon_vqshl_n_v:
916 case NEON::BI__builtin_neon_vqshlq_n_v:
917 case NEON::BI__builtin_neon_vqshlu_n_v:
918 case NEON::BI__builtin_neon_vqshluq_n_v:
919 case NEON::BI__builtin_neon_vrecpe_v:
920 case NEON::BI__builtin_neon_vrecpeq_v:
921 case NEON::BI__builtin_neon_vrsqrte_v:
922 case NEON::BI__builtin_neon_vrsqrteq_v:
923 case NEON::BI__builtin_neon_vrndi_v:
924 case NEON::BI__builtin_neon_vrndiq_v:
926 std::string(
"unimplemented AArch64 builtin call: ") +
928 return mlir::Value{};
929 case NEON::BI__builtin_neon_vrshr_n_v:
930 case NEON::BI__builtin_neon_vrshrq_n_v: {
931 llvm::StringRef intrName =
932 usgn ?
"aarch64.neon.urshl" :
"aarch64.neon.srshl";
935 {ty, usgn ? getSignChangedVectorType(cgf.getBuilder(), ty) : ty}, ops,
936 intrName, ty, loc,
false,
940 case NEON::BI__builtin_neon_vsha512hq_u64:
941 case NEON::BI__builtin_neon_vsha512h2q_u64:
942 case NEON::BI__builtin_neon_vsha512su0q_u64:
943 case NEON::BI__builtin_neon_vsha512su1q_u64:
945 std::string(
"unimplemented AArch64 builtin call: ") +
947 return mlir::Value{};
948 case NEON::BI__builtin_neon_vshl_n_v:
949 case NEON::BI__builtin_neon_vshlq_n_v:
952 case NEON::BI__builtin_neon_vshll_n_v:
953 case NEON::BI__builtin_neon_vshrn_n_v:
955 std::string(
"unimplemented AArch64 builtin call: ") +
957 return mlir::Value{};
958 case NEON::BI__builtin_neon_vshr_n_v:
959 case NEON::BI__builtin_neon_vshrq_n_v:
961 case NEON::BI__builtin_neon_vst1_v:
962 case NEON::BI__builtin_neon_vst1q_v:
963 case NEON::BI__builtin_neon_vst2_v:
964 case NEON::BI__builtin_neon_vst2q_v:
965 case NEON::BI__builtin_neon_vst3_v:
966 case NEON::BI__builtin_neon_vst3q_v:
967 case NEON::BI__builtin_neon_vst4_v:
968 case NEON::BI__builtin_neon_vst4q_v:
969 case NEON::BI__builtin_neon_vst2_lane_v:
970 case NEON::BI__builtin_neon_vst2q_lane_v:
971 case NEON::BI__builtin_neon_vst3_lane_v:
972 case NEON::BI__builtin_neon_vst3q_lane_v:
973 case NEON::BI__builtin_neon_vst4_lane_v:
974 case NEON::BI__builtin_neon_vst4q_lane_v:
975 case NEON::BI__builtin_neon_vsm3partw1q_u32:
976 case NEON::BI__builtin_neon_vsm3partw2q_u32:
977 case NEON::BI__builtin_neon_vsm3ss1q_u32:
978 case NEON::BI__builtin_neon_vsm4ekeyq_u32:
979 case NEON::BI__builtin_neon_vsm4eq_u32:
980 case NEON::BI__builtin_neon_vsm3tt1aq_u32:
981 case NEON::BI__builtin_neon_vsm3tt1bq_u32:
982 case NEON::BI__builtin_neon_vsm3tt2aq_u32:
983 case NEON::BI__builtin_neon_vsm3tt2bq_u32:
984 case NEON::BI__builtin_neon_vst1_x2_v:
985 case NEON::BI__builtin_neon_vst1q_x2_v:
986 case NEON::BI__builtin_neon_vst1_x3_v:
987 case NEON::BI__builtin_neon_vst1q_x3_v:
988 case NEON::BI__builtin_neon_vst1_x4_v:
989 case NEON::BI__builtin_neon_vst1q_x4_v:
990 case NEON::BI__builtin_neon_vsubhn_v:
991 case NEON::BI__builtin_neon_vtrn_v:
992 case NEON::BI__builtin_neon_vtrnq_v:
993 case NEON::BI__builtin_neon_vtst_v:
994 case NEON::BI__builtin_neon_vtstq_v:
995 case NEON::BI__builtin_neon_vuzp_v:
996 case NEON::BI__builtin_neon_vuzpq_v:
997 case NEON::BI__builtin_neon_vxarq_u64:
998 case NEON::BI__builtin_neon_vzip_v:
999 case NEON::BI__builtin_neon_vzipq_v:
1000 case NEON::BI__builtin_neon_vdot_s32:
1001 case NEON::BI__builtin_neon_vdot_u32:
1002 case NEON::BI__builtin_neon_vdotq_s32:
1003 case NEON::BI__builtin_neon_vdotq_u32:
1004 case NEON::BI__builtin_neon_vfmlal_low_f16:
1005 case NEON::BI__builtin_neon_vfmlalq_low_f16:
1006 case NEON::BI__builtin_neon_vfmlsl_low_f16:
1007 case NEON::BI__builtin_neon_vfmlslq_low_f16:
1008 case NEON::BI__builtin_neon_vfmlal_high_f16:
1009 case NEON::BI__builtin_neon_vfmlalq_high_f16:
1010 case NEON::BI__builtin_neon_vfmlsl_high_f16:
1011 case NEON::BI__builtin_neon_vfmlslq_high_f16:
1012 case NEON::BI__builtin_neon_vmmlaq_s32:
1013 case NEON::BI__builtin_neon_vmmlaq_u32:
1015 std::string(
"unimplemented AArch64 builtin call: ") +
1017 return mlir::Value{};
1018 case NEON::BI__builtin_neon_vmul_v:
1019 case NEON::BI__builtin_neon_vmulq_v:
1022 case NEON::BI__builtin_neon_vusmmlaq_s32:
1023 case NEON::BI__builtin_neon_vusdot_s32:
1024 case NEON::BI__builtin_neon_vusdotq_s32:
1025 case NEON::BI__builtin_neon_vbfdot_f32:
1026 case NEON::BI__builtin_neon_vbfdotq_f32:
1027 case NEON::BI__builtin_neon___a32_vcvt_bf16_f32:
1029 std::string(
"unimplemented AArch64 builtin call: ") +
1031 return mlir::Value{};
1037 switch (builtinID) {
1040 std::string(
"unimplemented AArch64 builtin call: ") +
1043 case NEON::BI__builtin_neon_vshl_v:
1044 case NEON::BI__builtin_neon_vshlq_v: {
1045 llvm::StringRef llvmIntrName =
1047 usgn ? llvmIntrinsic : altLLVMIntrinsic));
1049 mlir::Value result =
1051 {vTy, vTy}, ops, llvmIntrName,
1467 NEON::BI__builtin_neon_splat_lane_bf16,
1468 NEON::BI__builtin_neon_splat_lane_v,
1471 NEON::BI__builtin_neon_splat_laneq_bf16,
1472 NEON::BI__builtin_neon_splat_laneq_v,
1475 NEON::BI__builtin_neon_splatq_lane_bf16,
1476 NEON::BI__builtin_neon_splatq_lane_v,
1479 NEON::BI__builtin_neon_splatq_laneq_bf16,
1480 NEON::BI__builtin_neon_splatq_laneq_v,
1483 NEON::BI__builtin_neon_vabd_f16,
1484 NEON::BI__builtin_neon_vabd_v,
1487 NEON::BI__builtin_neon_vabdq_f16,
1488 NEON::BI__builtin_neon_vabdq_v,
1491 NEON::BI__builtin_neon_vabs_f16,
1492 NEON::BI__builtin_neon_vabs_v,
1495 NEON::BI__builtin_neon_vabsq_f16,
1496 NEON::BI__builtin_neon_vabsq_v,
1499 NEON::BI__builtin_neon_vcage_f16,
1500 NEON::BI__builtin_neon_vcage_v,
1503 NEON::BI__builtin_neon_vcageq_f16,
1504 NEON::BI__builtin_neon_vcageq_v,
1507 NEON::BI__builtin_neon_vcagt_f16,
1508 NEON::BI__builtin_neon_vcagt_v,
1511 NEON::BI__builtin_neon_vcagtq_f16,
1512 NEON::BI__builtin_neon_vcagtq_v,
1515 NEON::BI__builtin_neon_vcale_f16,
1516 NEON::BI__builtin_neon_vcale_v,
1519 NEON::BI__builtin_neon_vcaleq_f16,
1520 NEON::BI__builtin_neon_vcaleq_v,
1523 NEON::BI__builtin_neon_vcalt_f16,
1524 NEON::BI__builtin_neon_vcalt_v,
1527 NEON::BI__builtin_neon_vcaltq_f16,
1528 NEON::BI__builtin_neon_vcaltq_v,
1531 NEON::BI__builtin_neon_vceqz_f16,
1532 NEON::BI__builtin_neon_vceqz_v,
1535 NEON::BI__builtin_neon_vceqzq_f16,
1536 NEON::BI__builtin_neon_vceqzq_v,
1539 NEON::BI__builtin_neon_vcgez_f16,
1540 NEON::BI__builtin_neon_vcgez_v,
1543 NEON::BI__builtin_neon_vcgezq_f16,
1544 NEON::BI__builtin_neon_vcgezq_v,
1547 NEON::BI__builtin_neon_vcgtz_f16,
1548 NEON::BI__builtin_neon_vcgtz_v,
1551 NEON::BI__builtin_neon_vcgtzq_f16,
1552 NEON::BI__builtin_neon_vcgtzq_v,
1555 NEON::BI__builtin_neon_vclez_f16,
1556 NEON::BI__builtin_neon_vclez_v,
1559 NEON::BI__builtin_neon_vclezq_f16,
1560 NEON::BI__builtin_neon_vclezq_v,
1563 NEON::BI__builtin_neon_vcltz_f16,
1564 NEON::BI__builtin_neon_vcltz_v,
1567 NEON::BI__builtin_neon_vcltzq_f16,
1568 NEON::BI__builtin_neon_vcltzq_v,
1571 NEON::BI__builtin_neon_vfma_f16,
1572 NEON::BI__builtin_neon_vfma_v,
1575 NEON::BI__builtin_neon_vfma_lane_f16,
1576 NEON::BI__builtin_neon_vfma_lane_v,
1579 NEON::BI__builtin_neon_vfma_laneq_f16,
1580 NEON::BI__builtin_neon_vfma_laneq_v,
1583 NEON::BI__builtin_neon_vfmaq_f16,
1584 NEON::BI__builtin_neon_vfmaq_v,
1587 NEON::BI__builtin_neon_vfmaq_lane_f16,
1588 NEON::BI__builtin_neon_vfmaq_lane_v,
1591 NEON::BI__builtin_neon_vfmaq_laneq_f16,
1592 NEON::BI__builtin_neon_vfmaq_laneq_v,
1594 {NEON::BI__builtin_neon_vld1_bf16_x2, NEON::BI__builtin_neon_vld1_x2_v},
1595 {NEON::BI__builtin_neon_vld1_bf16_x3, NEON::BI__builtin_neon_vld1_x3_v},
1596 {NEON::BI__builtin_neon_vld1_bf16_x4, NEON::BI__builtin_neon_vld1_x4_v},
1597 {NEON::BI__builtin_neon_vld1_bf16, NEON::BI__builtin_neon_vld1_v},
1598 {NEON::BI__builtin_neon_vld1_dup_bf16, NEON::BI__builtin_neon_vld1_dup_v},
1599 {NEON::BI__builtin_neon_vld1_lane_bf16, NEON::BI__builtin_neon_vld1_lane_v},
1600 {NEON::BI__builtin_neon_vld1q_bf16_x2, NEON::BI__builtin_neon_vld1q_x2_v},
1601 {NEON::BI__builtin_neon_vld1q_bf16_x3, NEON::BI__builtin_neon_vld1q_x3_v},
1602 {NEON::BI__builtin_neon_vld1q_bf16_x4, NEON::BI__builtin_neon_vld1q_x4_v},
1603 {NEON::BI__builtin_neon_vld1q_bf16, NEON::BI__builtin_neon_vld1q_v},
1604 {NEON::BI__builtin_neon_vld1q_dup_bf16, NEON::BI__builtin_neon_vld1q_dup_v},
1605 {NEON::BI__builtin_neon_vld1q_lane_bf16,
1606 NEON::BI__builtin_neon_vld1q_lane_v},
1607 {NEON::BI__builtin_neon_vld2_bf16, NEON::BI__builtin_neon_vld2_v},
1608 {NEON::BI__builtin_neon_vld2_dup_bf16, NEON::BI__builtin_neon_vld2_dup_v},
1609 {NEON::BI__builtin_neon_vld2_lane_bf16, NEON::BI__builtin_neon_vld2_lane_v},
1610 {NEON::BI__builtin_neon_vld2q_bf16, NEON::BI__builtin_neon_vld2q_v},
1611 {NEON::BI__builtin_neon_vld2q_dup_bf16, NEON::BI__builtin_neon_vld2q_dup_v},
1612 {NEON::BI__builtin_neon_vld2q_lane_bf16,
1613 NEON::BI__builtin_neon_vld2q_lane_v},
1614 {NEON::BI__builtin_neon_vld3_bf16, NEON::BI__builtin_neon_vld3_v},
1615 {NEON::BI__builtin_neon_vld3_dup_bf16, NEON::BI__builtin_neon_vld3_dup_v},
1616 {NEON::BI__builtin_neon_vld3_lane_bf16, NEON::BI__builtin_neon_vld3_lane_v},
1617 {NEON::BI__builtin_neon_vld3q_bf16, NEON::BI__builtin_neon_vld3q_v},
1618 {NEON::BI__builtin_neon_vld3q_dup_bf16, NEON::BI__builtin_neon_vld3q_dup_v},
1619 {NEON::BI__builtin_neon_vld3q_lane_bf16,
1620 NEON::BI__builtin_neon_vld3q_lane_v},
1621 {NEON::BI__builtin_neon_vld4_bf16, NEON::BI__builtin_neon_vld4_v},
1622 {NEON::BI__builtin_neon_vld4_dup_bf16, NEON::BI__builtin_neon_vld4_dup_v},
1623 {NEON::BI__builtin_neon_vld4_lane_bf16, NEON::BI__builtin_neon_vld4_lane_v},
1624 {NEON::BI__builtin_neon_vld4q_bf16, NEON::BI__builtin_neon_vld4q_v},
1625 {NEON::BI__builtin_neon_vld4q_dup_bf16, NEON::BI__builtin_neon_vld4q_dup_v},
1626 {NEON::BI__builtin_neon_vld4q_lane_bf16,
1627 NEON::BI__builtin_neon_vld4q_lane_v},
1629 NEON::BI__builtin_neon_vmax_f16,
1630 NEON::BI__builtin_neon_vmax_v,
1633 NEON::BI__builtin_neon_vmaxnm_f16,
1634 NEON::BI__builtin_neon_vmaxnm_v,
1637 NEON::BI__builtin_neon_vmaxnmq_f16,
1638 NEON::BI__builtin_neon_vmaxnmq_v,
1641 NEON::BI__builtin_neon_vmaxq_f16,
1642 NEON::BI__builtin_neon_vmaxq_v,
1645 NEON::BI__builtin_neon_vmin_f16,
1646 NEON::BI__builtin_neon_vmin_v,
1649 NEON::BI__builtin_neon_vminnm_f16,
1650 NEON::BI__builtin_neon_vminnm_v,
1653 NEON::BI__builtin_neon_vminnmq_f16,
1654 NEON::BI__builtin_neon_vminnmq_v,
1657 NEON::BI__builtin_neon_vminq_f16,
1658 NEON::BI__builtin_neon_vminq_v,
1661 NEON::BI__builtin_neon_vmulx_f16,
1662 NEON::BI__builtin_neon_vmulx_v,
1665 NEON::BI__builtin_neon_vmulxq_f16,
1666 NEON::BI__builtin_neon_vmulxq_v,
1669 NEON::BI__builtin_neon_vpadd_f16,
1670 NEON::BI__builtin_neon_vpadd_v,
1673 NEON::BI__builtin_neon_vpaddq_f16,
1674 NEON::BI__builtin_neon_vpaddq_v,
1677 NEON::BI__builtin_neon_vpmax_f16,
1678 NEON::BI__builtin_neon_vpmax_v,
1681 NEON::BI__builtin_neon_vpmaxnm_f16,
1682 NEON::BI__builtin_neon_vpmaxnm_v,
1685 NEON::BI__builtin_neon_vpmaxnmq_f16,
1686 NEON::BI__builtin_neon_vpmaxnmq_v,
1689 NEON::BI__builtin_neon_vpmaxq_f16,
1690 NEON::BI__builtin_neon_vpmaxq_v,
1693 NEON::BI__builtin_neon_vpmin_f16,
1694 NEON::BI__builtin_neon_vpmin_v,
1697 NEON::BI__builtin_neon_vpminnm_f16,
1698 NEON::BI__builtin_neon_vpminnm_v,
1701 NEON::BI__builtin_neon_vpminnmq_f16,
1702 NEON::BI__builtin_neon_vpminnmq_v,
1705 NEON::BI__builtin_neon_vpminq_f16,
1706 NEON::BI__builtin_neon_vpminq_v,
1709 NEON::BI__builtin_neon_vrecpe_f16,
1710 NEON::BI__builtin_neon_vrecpe_v,
1713 NEON::BI__builtin_neon_vrecpeq_f16,
1714 NEON::BI__builtin_neon_vrecpeq_v,
1717 NEON::BI__builtin_neon_vrecps_f16,
1718 NEON::BI__builtin_neon_vrecps_v,
1721 NEON::BI__builtin_neon_vrecpsq_f16,
1722 NEON::BI__builtin_neon_vrecpsq_v,
1725 NEON::BI__builtin_neon_vrnd_f16,
1726 NEON::BI__builtin_neon_vrnd_v,
1729 NEON::BI__builtin_neon_vrnda_f16,
1730 NEON::BI__builtin_neon_vrnda_v,
1733 NEON::BI__builtin_neon_vrndaq_f16,
1734 NEON::BI__builtin_neon_vrndaq_v,
1737 NEON::BI__builtin_neon_vrndi_f16,
1738 NEON::BI__builtin_neon_vrndi_v,
1741 NEON::BI__builtin_neon_vrndiq_f16,
1742 NEON::BI__builtin_neon_vrndiq_v,
1745 NEON::BI__builtin_neon_vrndm_f16,
1746 NEON::BI__builtin_neon_vrndm_v,
1749 NEON::BI__builtin_neon_vrndmq_f16,
1750 NEON::BI__builtin_neon_vrndmq_v,
1753 NEON::BI__builtin_neon_vrndn_f16,
1754 NEON::BI__builtin_neon_vrndn_v,
1757 NEON::BI__builtin_neon_vrndnq_f16,
1758 NEON::BI__builtin_neon_vrndnq_v,
1761 NEON::BI__builtin_neon_vrndp_f16,
1762 NEON::BI__builtin_neon_vrndp_v,
1765 NEON::BI__builtin_neon_vrndpq_f16,
1766 NEON::BI__builtin_neon_vrndpq_v,
1769 NEON::BI__builtin_neon_vrndq_f16,
1770 NEON::BI__builtin_neon_vrndq_v,
1773 NEON::BI__builtin_neon_vrndx_f16,
1774 NEON::BI__builtin_neon_vrndx_v,
1777 NEON::BI__builtin_neon_vrndxq_f16,
1778 NEON::BI__builtin_neon_vrndxq_v,
1781 NEON::BI__builtin_neon_vrsqrte_f16,
1782 NEON::BI__builtin_neon_vrsqrte_v,
1785 NEON::BI__builtin_neon_vrsqrteq_f16,
1786 NEON::BI__builtin_neon_vrsqrteq_v,
1789 NEON::BI__builtin_neon_vrsqrts_f16,
1790 NEON::BI__builtin_neon_vrsqrts_v,
1793 NEON::BI__builtin_neon_vrsqrtsq_f16,
1794 NEON::BI__builtin_neon_vrsqrtsq_v,
1797 NEON::BI__builtin_neon_vsqrt_f16,
1798 NEON::BI__builtin_neon_vsqrt_v,
1801 NEON::BI__builtin_neon_vsqrtq_f16,
1802 NEON::BI__builtin_neon_vsqrtq_v,
1804 {NEON::BI__builtin_neon_vst1_bf16_x2, NEON::BI__builtin_neon_vst1_x2_v},
1805 {NEON::BI__builtin_neon_vst1_bf16_x3, NEON::BI__builtin_neon_vst1_x3_v},
1806 {NEON::BI__builtin_neon_vst1_bf16_x4, NEON::BI__builtin_neon_vst1_x4_v},
1807 {NEON::BI__builtin_neon_vst1_bf16, NEON::BI__builtin_neon_vst1_v},
1808 {NEON::BI__builtin_neon_vst1_lane_bf16, NEON::BI__builtin_neon_vst1_lane_v},
1809 {NEON::BI__builtin_neon_vst1q_bf16_x2, NEON::BI__builtin_neon_vst1q_x2_v},
1810 {NEON::BI__builtin_neon_vst1q_bf16_x3, NEON::BI__builtin_neon_vst1q_x3_v},
1811 {NEON::BI__builtin_neon_vst1q_bf16_x4, NEON::BI__builtin_neon_vst1q_x4_v},
1812 {NEON::BI__builtin_neon_vst1q_bf16, NEON::BI__builtin_neon_vst1q_v},
1813 {NEON::BI__builtin_neon_vst1q_lane_bf16,
1814 NEON::BI__builtin_neon_vst1q_lane_v},
1815 {NEON::BI__builtin_neon_vst2_bf16, NEON::BI__builtin_neon_vst2_v},
1816 {NEON::BI__builtin_neon_vst2_lane_bf16, NEON::BI__builtin_neon_vst2_lane_v},
1817 {NEON::BI__builtin_neon_vst2q_bf16, NEON::BI__builtin_neon_vst2q_v},
1818 {NEON::BI__builtin_neon_vst2q_lane_bf16,
1819 NEON::BI__builtin_neon_vst2q_lane_v},
1820 {NEON::BI__builtin_neon_vst3_bf16, NEON::BI__builtin_neon_vst3_v},
1821 {NEON::BI__builtin_neon_vst3_lane_bf16, NEON::BI__builtin_neon_vst3_lane_v},
1822 {NEON::BI__builtin_neon_vst3q_bf16, NEON::BI__builtin_neon_vst3q_v},
1823 {NEON::BI__builtin_neon_vst3q_lane_bf16,
1824 NEON::BI__builtin_neon_vst3q_lane_v},
1825 {NEON::BI__builtin_neon_vst4_bf16, NEON::BI__builtin_neon_vst4_v},
1826 {NEON::BI__builtin_neon_vst4_lane_bf16, NEON::BI__builtin_neon_vst4_lane_v},
1827 {NEON::BI__builtin_neon_vst4q_bf16, NEON::BI__builtin_neon_vst4q_v},
1828 {NEON::BI__builtin_neon_vst4q_lane_bf16,
1829 NEON::BI__builtin_neon_vst4q_lane_v},
1833 {NEON::BI__builtin_neon_vldap1_lane_u64,
1834 NEON::BI__builtin_neon_vldap1_lane_s64},
1835 {NEON::BI__builtin_neon_vldap1_lane_f64,
1836 NEON::BI__builtin_neon_vldap1_lane_s64},
1837 {NEON::BI__builtin_neon_vldap1_lane_p64,
1838 NEON::BI__builtin_neon_vldap1_lane_s64},
1839 {NEON::BI__builtin_neon_vldap1q_lane_u64,
1840 NEON::BI__builtin_neon_vldap1q_lane_s64},
1841 {NEON::BI__builtin_neon_vldap1q_lane_f64,
1842 NEON::BI__builtin_neon_vldap1q_lane_s64},
1843 {NEON::BI__builtin_neon_vldap1q_lane_p64,
1844 NEON::BI__builtin_neon_vldap1q_lane_s64},
1845 {NEON::BI__builtin_neon_vstl1_lane_u64,
1846 NEON::BI__builtin_neon_vstl1_lane_s64},
1847 {NEON::BI__builtin_neon_vstl1_lane_f64,
1848 NEON::BI__builtin_neon_vstl1_lane_s64},
1849 {NEON::BI__builtin_neon_vstl1_lane_p64,
1850 NEON::BI__builtin_neon_vstl1_lane_s64},
1851 {NEON::BI__builtin_neon_vstl1q_lane_u64,
1852 NEON::BI__builtin_neon_vstl1q_lane_s64},
1853 {NEON::BI__builtin_neon_vstl1q_lane_f64,
1854 NEON::BI__builtin_neon_vstl1q_lane_s64},
1855 {NEON::BI__builtin_neon_vstl1q_lane_p64,
1856 NEON::BI__builtin_neon_vstl1q_lane_s64},
1862 llvm::Triple::ArchType arch) {
1871 if (builtinID == Builtin::BI__builtin_cpu_supports) {
1872 cgm.errorNYI(
expr->getSourceRange(),
1873 std::string(
"unimplemented AArch64 builtin call: ") +
1874 getContext().BuiltinInfo.getName(builtinID));
1875 return mlir::Value{};
1878 switch (builtinID) {
1881 case clang::AArch64::BI__builtin_arm_nop:
1882 case clang::AArch64::BI__builtin_arm_yield:
1883 case clang::AArch64::BI__yield:
1884 case clang::AArch64::BI__builtin_arm_wfe:
1885 case clang::AArch64::BI__wfe:
1886 case clang::AArch64::BI__builtin_arm_wfi:
1887 case clang::AArch64::BI__wfi:
1888 case clang::AArch64::BI__builtin_arm_sev:
1889 case clang::AArch64::BI__sev:
1890 case clang::AArch64::BI__builtin_arm_sevl:
1891 case clang::AArch64::BI__sevl:
1892 cgm.errorNYI(
expr->getSourceRange(),
1893 std::string(
"unimplemented AArch64 builtin call: ") +
1894 getContext().BuiltinInfo.getName(builtinID));
1895 return mlir::Value{};
1898 if (builtinID == clang::AArch64::BI__builtin_arm_trap) {
1899 cgm.errorNYI(
expr->getSourceRange(),
1900 std::string(
"unimplemented AArch64 builtin call: ") +
1901 getContext().BuiltinInfo.getName(builtinID));
1902 return mlir::Value{};
1905 if (builtinID == clang::AArch64::BI__builtin_arm_get_sme_state) {
1906 cgm.errorNYI(
expr->getSourceRange(),
1907 std::string(
"unimplemented AArch64 builtin call: ") +
1908 getContext().BuiltinInfo.getName(builtinID));
1909 return mlir::Value{};
1912 if (builtinID == clang::AArch64::BI__builtin_arm_rbit) {
1913 cgm.errorNYI(
expr->getSourceRange(),
1914 std::string(
"unimplemented AArch64 builtin call: ") +
1915 getContext().BuiltinInfo.getName(builtinID));
1916 return mlir::Value{};
1918 if (builtinID == clang::AArch64::BI__builtin_arm_rbit64) {
1919 cgm.errorNYI(
expr->getSourceRange(),
1920 std::string(
"unimplemented AArch64 builtin call: ") +
1921 getContext().BuiltinInfo.getName(builtinID));
1922 return mlir::Value{};
1925 if (builtinID == clang::AArch64::BI__builtin_arm_clz ||
1926 builtinID == clang::AArch64::BI__builtin_arm_clz64) {
1927 cgm.errorNYI(
expr->getSourceRange(),
1928 std::string(
"unimplemented AArch64 builtin call: ") +
1929 getContext().BuiltinInfo.getName(builtinID));
1930 return mlir::Value{};
1933 if (builtinID == clang::AArch64::BI__builtin_arm_cls) {
1934 cgm.errorNYI(
expr->getSourceRange(),
1935 std::string(
"unimplemented AArch64 builtin call: ") +
1936 getContext().BuiltinInfo.getName(builtinID));
1937 return mlir::Value{};
1939 if (builtinID == clang::AArch64::BI__builtin_arm_cls64) {
1940 cgm.errorNYI(
expr->getSourceRange(),
1941 std::string(
"unimplemented AArch64 builtin call: ") +
1942 getContext().BuiltinInfo.getName(builtinID));
1943 return mlir::Value{};
1946 if (builtinID == clang::AArch64::BI__builtin_arm_rint32zf ||
1947 builtinID == clang::AArch64::BI__builtin_arm_rint32z) {
1948 cgm.errorNYI(
expr->getSourceRange(),
1949 std::string(
"unimplemented AArch64 builtin call: ") +
1950 getContext().BuiltinInfo.getName(builtinID));
1951 return mlir::Value{};
1954 if (builtinID == clang::AArch64::BI__builtin_arm_rint64zf ||
1955 builtinID == clang::AArch64::BI__builtin_arm_rint64z) {
1956 cgm.errorNYI(
expr->getSourceRange(),
1957 std::string(
"unimplemented AArch64 builtin call: ") +
1958 getContext().BuiltinInfo.getName(builtinID));
1959 return mlir::Value{};
1962 if (builtinID == clang::AArch64::BI__builtin_arm_rint32xf ||
1963 builtinID == clang::AArch64::BI__builtin_arm_rint32x) {
1964 cgm.errorNYI(
expr->getSourceRange(),
1965 std::string(
"unimplemented AArch64 builtin call: ") +
1966 getContext().BuiltinInfo.getName(builtinID));
1967 return mlir::Value{};
1970 if (builtinID == clang::AArch64::BI__builtin_arm_rint64xf ||
1971 builtinID == clang::AArch64::BI__builtin_arm_rint64x) {
1972 cgm.errorNYI(
expr->getSourceRange(),
1973 std::string(
"unimplemented AArch64 builtin call: ") +
1974 getContext().BuiltinInfo.getName(builtinID));
1975 return mlir::Value{};
1978 if (builtinID == clang::AArch64::BI__builtin_arm_jcvt) {
1979 cgm.errorNYI(
expr->getSourceRange(),
1980 std::string(
"unimplemented AArch64 builtin call: ") +
1981 getContext().BuiltinInfo.getName(builtinID));
1982 return mlir::Value{};
1985 if (builtinID == clang::AArch64::BI__builtin_arm_ld64b ||
1986 builtinID == clang::AArch64::BI__builtin_arm_st64b ||
1987 builtinID == clang::AArch64::BI__builtin_arm_st64bv ||
1988 builtinID == clang::AArch64::BI__builtin_arm_st64bv0) {
1989 cgm.errorNYI(
expr->getSourceRange(),
1990 std::string(
"unimplemented AArch64 builtin call: ") +
1991 getContext().BuiltinInfo.getName(builtinID));
1992 return mlir::Value{};
1995 if (builtinID == clang::AArch64::BI__builtin_arm_rndr ||
1996 builtinID == clang::AArch64::BI__builtin_arm_rndrrs) {
1997 cgm.errorNYI(
expr->getSourceRange(),
1998 std::string(
"unimplemented AArch64 builtin call: ") +
1999 getContext().BuiltinInfo.getName(builtinID));
2000 return mlir::Value{};
2003 if (builtinID == clang::AArch64::BI__clear_cache) {
2004 cgm.errorNYI(
expr->getSourceRange(),
2005 std::string(
"unimplemented AArch64 builtin call: ") +
2006 getContext().BuiltinInfo.getName(builtinID));
2007 return mlir::Value{};
2010 if ((builtinID == clang::AArch64::BI__builtin_arm_ldrex ||
2011 builtinID == clang::AArch64::BI__builtin_arm_ldaex) &&
2013 cgm.errorNYI(
expr->getSourceRange(),
2014 std::string(
"unimplemented AArch64 builtin call: ") +
2015 getContext().BuiltinInfo.getName(builtinID));
2016 return mlir::Value{};
2018 if (builtinID == clang::AArch64::BI__builtin_arm_ldrex ||
2019 builtinID == clang::AArch64::BI__builtin_arm_ldaex) {
2020 cgm.errorNYI(
expr->getSourceRange(),
2021 std::string(
"unimplemented AArch64 builtin call: ") +
2022 getContext().BuiltinInfo.getName(builtinID));
2023 return mlir::Value{};
2026 if ((builtinID == clang::AArch64::BI__builtin_arm_strex ||
2027 builtinID == clang::AArch64::BI__builtin_arm_stlex) &&
2029 cgm.errorNYI(
expr->getSourceRange(),
2030 std::string(
"unimplemented AArch64 builtin call: ") +
2031 getContext().BuiltinInfo.getName(builtinID));
2032 return mlir::Value{};
2035 if (builtinID == clang::AArch64::BI__builtin_arm_strex ||
2036 builtinID == clang::AArch64::BI__builtin_arm_stlex) {
2037 cgm.errorNYI(
expr->getSourceRange(),
2038 std::string(
"unimplemented AArch64 builtin call: ") +
2039 getContext().BuiltinInfo.getName(builtinID));
2040 return mlir::Value{};
2043 if (builtinID == clang::AArch64::BI__getReg ||
2044 builtinID == clang::AArch64::BI__setReg ||
2045 builtinID == clang::AArch64::BI__getRegFp ||
2046 builtinID == clang::AArch64::BI__setRegFp) {
2047 cgm.errorNYI(
expr->getSourceRange(),
2048 std::string(
"unimplemented AArch64 builtin call: ") +
2049 getContext().BuiltinInfo.getName(builtinID));
2050 return mlir::Value{};
2053 if (builtinID == clang::AArch64::BI__break) {
2054 cgm.errorNYI(
expr->getSourceRange(),
2055 std::string(
"unimplemented AArch64 builtin call: ") +
2056 getContext().BuiltinInfo.getName(builtinID));
2057 return mlir::Value{};
2060 if (builtinID == clang::AArch64::BI__builtin_arm_clrex) {
2061 cgm.errorNYI(
expr->getSourceRange(),
2062 std::string(
"unimplemented AArch64 builtin call: ") +
2063 getContext().BuiltinInfo.getName(builtinID));
2064 return mlir::Value{};
2067 if (builtinID == clang::AArch64::BI_ReadWriteBarrier) {
2068 cgm.errorNYI(
expr->getSourceRange(),
2069 std::string(
"unimplemented AArch64 builtin call: ") +
2070 getContext().BuiltinInfo.getName(builtinID));
2071 return mlir::Value{};
2075 Intrinsic::ID crcIntrinsicID = Intrinsic::not_intrinsic;
2076 switch (builtinID) {
2077 case clang::AArch64::BI__builtin_arm_crc32b:
2078 crcIntrinsicID = Intrinsic::aarch64_crc32b;
2080 case clang::AArch64::BI__builtin_arm_crc32cb:
2081 crcIntrinsicID = Intrinsic::aarch64_crc32cb;
2083 case clang::AArch64::BI__builtin_arm_crc32h:
2084 crcIntrinsicID = Intrinsic::aarch64_crc32h;
2086 case clang::AArch64::BI__builtin_arm_crc32ch:
2087 crcIntrinsicID = Intrinsic::aarch64_crc32ch;
2089 case clang::AArch64::BI__builtin_arm_crc32w:
2090 crcIntrinsicID = Intrinsic::aarch64_crc32w;
2092 case clang::AArch64::BI__builtin_arm_crc32cw:
2093 crcIntrinsicID = Intrinsic::aarch64_crc32cw;
2095 case clang::AArch64::BI__builtin_arm_crc32d:
2096 crcIntrinsicID = Intrinsic::aarch64_crc32x;
2098 case clang::AArch64::BI__builtin_arm_crc32cd:
2099 crcIntrinsicID = Intrinsic::aarch64_crc32cx;
2103 if (crcIntrinsicID != Intrinsic::not_intrinsic) {
2104 cgm.errorNYI(
expr->getSourceRange(),
2105 std::string(
"unimplemented AArch64 builtin call: ") +
2106 getContext().BuiltinInfo.getName(builtinID));
2107 return mlir::Value{};
2111 if (builtinID == AArch64::BI__builtin_arm_mops_memset_tag) {
2112 cgm.errorNYI(
expr->getSourceRange(),
2113 std::string(
"unimplemented AArch64 builtin call: ") +
2114 getContext().BuiltinInfo.getName(builtinID));
2115 return mlir::Value{};
2119 Intrinsic::ID mteIntrinsicID = Intrinsic::not_intrinsic;
2120 switch (builtinID) {
2121 case clang::AArch64::BI__builtin_arm_irg:
2122 mteIntrinsicID = Intrinsic::aarch64_irg;
2124 case clang::AArch64::BI__builtin_arm_addg:
2125 mteIntrinsicID = Intrinsic::aarch64_addg;
2127 case clang::AArch64::BI__builtin_arm_gmi:
2128 mteIntrinsicID = Intrinsic::aarch64_gmi;
2130 case clang::AArch64::BI__builtin_arm_ldg:
2131 mteIntrinsicID = Intrinsic::aarch64_ldg;
2133 case clang::AArch64::BI__builtin_arm_stg:
2134 mteIntrinsicID = Intrinsic::aarch64_stg;
2136 case clang::AArch64::BI__builtin_arm_subp:
2137 mteIntrinsicID = Intrinsic::aarch64_subp;
2141 if (mteIntrinsicID != Intrinsic::not_intrinsic) {
2142 cgm.errorNYI(
expr->getSourceRange(),
2143 std::string(
"unimplemented AArch64 builtin call: ") +
2144 getContext().BuiltinInfo.getName(builtinID));
2145 return mlir::Value{};
2148 if (builtinID == clang::AArch64::BI__builtin_arm_rsr ||
2149 builtinID == clang::AArch64::BI__builtin_arm_rsr64 ||
2150 builtinID == clang::AArch64::BI__builtin_arm_rsr128 ||
2151 builtinID == clang::AArch64::BI__builtin_arm_rsrp ||
2152 builtinID == clang::AArch64::BI__builtin_arm_wsr ||
2153 builtinID == clang::AArch64::BI__builtin_arm_wsr64 ||
2154 builtinID == clang::AArch64::BI__builtin_arm_wsr128 ||
2155 builtinID == clang::AArch64::BI__builtin_arm_wsrp) {
2156 cgm.errorNYI(
expr->getSourceRange(),
2157 std::string(
"unimplemented AArch64 builtin call: ") +
2158 getContext().BuiltinInfo.getName(builtinID));
2159 return mlir::Value{};
2162 if (builtinID == clang::AArch64::BI_ReadStatusReg ||
2163 builtinID == clang::AArch64::BI_WriteStatusReg ||
2164 builtinID == clang::AArch64::BI__sys) {
2165 cgm.errorNYI(
expr->getSourceRange(),
2166 std::string(
"unimplemented AArch64 builtin call: ") +
2167 getContext().BuiltinInfo.getName(builtinID));
2168 return mlir::Value{};
2171 if (builtinID == clang::AArch64::BI_AddressOfReturnAddress) {
2172 cgm.errorNYI(
expr->getSourceRange(),
2173 std::string(
"unimplemented AArch64 builtin call: ") +
2174 getContext().BuiltinInfo.getName(builtinID));
2175 return mlir::Value{};
2178 if (builtinID == clang::AArch64::BI__builtin_sponentry) {
2179 cgm.errorNYI(
expr->getSourceRange(),
2180 std::string(
"unimplemented AArch64 builtin call: ") +
2181 getContext().BuiltinInfo.getName(builtinID));
2182 return mlir::Value{};
2185 if (builtinID == clang::AArch64::BI__mulh ||
2186 builtinID == clang::AArch64::BI__umulh) {
2187 cgm.errorNYI(
expr->getSourceRange(),
2188 std::string(
"unimplemented AArch64 builtin call: ") +
2189 getContext().BuiltinInfo.getName(builtinID));
2190 return mlir::Value{};
2193 if (builtinID == AArch64::BI__writex18byte ||
2194 builtinID == AArch64::BI__writex18word ||
2195 builtinID == AArch64::BI__writex18dword ||
2196 builtinID == AArch64::BI__writex18qword) {
2197 cgm.errorNYI(
expr->getSourceRange(),
2198 std::string(
"unimplemented AArch64 builtin call: ") +
2199 getContext().BuiltinInfo.getName(builtinID));
2200 return mlir::Value{};
2203 if (builtinID == AArch64::BI__readx18byte ||
2204 builtinID == AArch64::BI__readx18word ||
2205 builtinID == AArch64::BI__readx18dword ||
2206 builtinID == AArch64::BI__readx18qword) {
2207 cgm.errorNYI(
expr->getSourceRange(),
2208 std::string(
"unimplemented AArch64 builtin call: ") +
2209 getContext().BuiltinInfo.getName(builtinID));
2210 return mlir::Value{};
2213 if (builtinID == AArch64::BI__addx18byte ||
2214 builtinID == AArch64::BI__addx18word ||
2215 builtinID == AArch64::BI__addx18dword ||
2216 builtinID == AArch64::BI__addx18qword ||
2217 builtinID == AArch64::BI__incx18byte ||
2218 builtinID == AArch64::BI__incx18word ||
2219 builtinID == AArch64::BI__incx18dword ||
2220 builtinID == AArch64::BI__incx18qword) {
2221 cgm.errorNYI(
expr->getSourceRange(),
2222 std::string(
"unimplemented AArch64 builtin call: ") +
2223 getContext().BuiltinInfo.getName(builtinID));
2224 return mlir::Value{};
2227 if (builtinID == AArch64::BI_CopyDoubleFromInt64 ||
2228 builtinID == AArch64::BI_CopyFloatFromInt32 ||
2229 builtinID == AArch64::BI_CopyInt32FromFloat ||
2230 builtinID == AArch64::BI_CopyInt64FromDouble) {
2231 cgm.errorNYI(
expr->getSourceRange(),
2232 std::string(
"unimplemented AArch64 builtin call: ") +
2233 getContext().BuiltinInfo.getName(builtinID));
2234 return mlir::Value{};
2237 if (builtinID == AArch64::BI_CountLeadingOnes ||
2238 builtinID == AArch64::BI_CountLeadingOnes64 ||
2239 builtinID == AArch64::BI_CountLeadingZeros ||
2240 builtinID == AArch64::BI_CountLeadingZeros64) {
2241 cgm.errorNYI(
expr->getSourceRange(),
2242 std::string(
"unimplemented AArch64 builtin call: ") +
2243 getContext().BuiltinInfo.getName(builtinID));
2244 return mlir::Value{};
2247 if (builtinID == AArch64::BI_CountLeadingSigns ||
2248 builtinID == AArch64::BI_CountLeadingSigns64) {
2249 cgm.errorNYI(
expr->getSourceRange(),
2250 std::string(
"unimplemented AArch64 builtin call: ") +
2251 getContext().BuiltinInfo.getName(builtinID));
2252 return mlir::Value{};
2255 if (builtinID == AArch64::BI_CountOneBits ||
2256 builtinID == AArch64::BI_CountOneBits64 ||
2257 builtinID == AArch64::BI_CountTrailingZeros ||
2258 builtinID == AArch64::BI_CountTrailingZeros64) {
2259 cgm.errorNYI(
expr->getSourceRange(),
2260 std::string(
"unimplemented AArch64 builtin call: ") +
2261 getContext().BuiltinInfo.getName(builtinID));
2262 return mlir::Value{};
2265 if (builtinID == AArch64::BI__prefetch ||
2266 builtinID == AArch64::BI__prefetch2) {
2267 cgm.errorNYI(
expr->getSourceRange(),
2268 std::string(
"unimplemented AArch64 builtin call: ") +
2269 getContext().BuiltinInfo.getName(builtinID));
2270 return mlir::Value{};
2273 if (builtinID == AArch64::BI__hlt) {
2274 cgm.errorNYI(
expr->getSourceRange(),
2275 std::string(
"unimplemented AArch64 builtin call: ") +
2276 getContext().BuiltinInfo.getName(builtinID));
2277 return mlir::Value{};
2280 if (builtinID == NEON::BI__builtin_neon_vcvth_bf16_f32) {
2281 cgm.errorNYI(
expr->getSourceRange(),
2282 std::string(
"unimplemented AArch64 builtin call: ") +
2283 getContext().BuiltinInfo.getName(builtinID));
2284 return mlir::Value{};
2293 return p.first == builtinID;
2296 builtinID = it->second;
2301 unsigned iceArguments = 0;
2310 unsigned numArgs =
expr->getNumArgs() - (hasExtraArg ? 1 : 0);
2311 for (
unsigned i = 0, e = numArgs; i != e; i++) {
2313 switch (builtinID) {
2314 case NEON::BI__builtin_neon_vld1_v:
2315 case NEON::BI__builtin_neon_vld1q_v:
2316 case NEON::BI__builtin_neon_vld1_dup_v:
2317 case NEON::BI__builtin_neon_vld1q_dup_v:
2318 case NEON::BI__builtin_neon_vld1_lane_v:
2319 case NEON::BI__builtin_neon_vld1q_lane_v:
2320 case NEON::BI__builtin_neon_vst1_v:
2321 case NEON::BI__builtin_neon_vst1q_v:
2322 case NEON::BI__builtin_neon_vst1_lane_v:
2323 case NEON::BI__builtin_neon_vst1q_lane_v:
2324 case NEON::BI__builtin_neon_vldap1_lane_s64:
2325 case NEON::BI__builtin_neon_vldap1q_lane_s64:
2326 case NEON::BI__builtin_neon_vstl1_lane_s64:
2327 case NEON::BI__builtin_neon_vstl1q_lane_s64:
2331 expr->getSourceRange(),
2332 std::string(
"unimplemented AArch64 builtin argument handling ") +
2333 getContext().BuiltinInfo.getName(builtinID));
2351 const Expr *arg =
expr->getArg(
expr->getNumArgs() - 1);
2355 if (std::optional<llvm::APSInt> result =
2359 bool usgn =
type.isUnsigned();
2361 mlir::Location loc =
getLoc(
expr->getExprLoc());
2374 switch (builtinID) {
2377 case NEON::BI__builtin_neon_vabsh_f16: {
2378 return cir::FAbsOp::create(builder, loc, ops);
2380 case NEON::BI__builtin_neon_vaddq_p128: {
2381 cir::VectorType byteTy = cir::VectorType::get(builder.getUInt8Ty(), 16);
2382 ops[0] = builder.createBitcast(ops[0], byteTy);
2383 ops[1] = builder.createBitcast(ops[1], byteTy);
2384 mlir::Value result = builder.createXor(loc, ops[0], ops[1]);
2387 case NEON::BI__builtin_neon_vldrq_p128:
2388 case NEON::BI__builtin_neon_vstrq_p128:
2389 case NEON::BI__builtin_neon_vcvts_f32_u32:
2390 case NEON::BI__builtin_neon_vcvtd_f64_u64:
2391 case NEON::BI__builtin_neon_vcvts_f32_s32:
2392 case NEON::BI__builtin_neon_vcvtd_f64_s64:
2393 case NEON::BI__builtin_neon_vcvth_f16_u16:
2394 case NEON::BI__builtin_neon_vcvth_f16_u32:
2395 case NEON::BI__builtin_neon_vcvth_f16_u64:
2396 case NEON::BI__builtin_neon_vcvth_f16_s16:
2397 case NEON::BI__builtin_neon_vcvth_f16_s32:
2398 case NEON::BI__builtin_neon_vcvth_f16_s64:
2399 case NEON::BI__builtin_neon_vcvtah_u16_f16:
2400 case NEON::BI__builtin_neon_vcvtmh_u16_f16:
2401 case NEON::BI__builtin_neon_vcvtnh_u16_f16:
2402 case NEON::BI__builtin_neon_vcvtph_u16_f16:
2403 case NEON::BI__builtin_neon_vcvth_u16_f16:
2404 case NEON::BI__builtin_neon_vcvtah_s16_f16:
2405 case NEON::BI__builtin_neon_vcvtmh_s16_f16:
2406 case NEON::BI__builtin_neon_vcvtnh_s16_f16:
2407 case NEON::BI__builtin_neon_vcvtph_s16_f16:
2408 case NEON::BI__builtin_neon_vcvth_s16_f16:
2409 case NEON::BI__builtin_neon_vcaleh_f16:
2410 case NEON::BI__builtin_neon_vcalth_f16:
2411 case NEON::BI__builtin_neon_vcageh_f16:
2412 case NEON::BI__builtin_neon_vcagth_f16:
2413 case NEON::BI__builtin_neon_vcvth_n_s16_f16:
2414 case NEON::BI__builtin_neon_vcvth_n_u16_f16:
2415 case NEON::BI__builtin_neon_vcvth_n_f16_s16:
2416 case NEON::BI__builtin_neon_vcvth_n_f16_u16:
2417 case NEON::BI__builtin_neon_vpaddd_s64:
2418 case NEON::BI__builtin_neon_vpaddd_f64:
2419 case NEON::BI__builtin_neon_vpadds_f32:
2420 cgm.errorNYI(
expr->getSourceRange(),
2421 std::string(
"unimplemented AArch64 builtin call: ") +
2422 getContext().BuiltinInfo.getName(builtinID));
2423 return mlir::Value{};
2424 case NEON::BI__builtin_neon_vceqzd_s64:
2425 case NEON::BI__builtin_neon_vceqzd_f64:
2426 case NEON::BI__builtin_neon_vceqzs_f32:
2427 case NEON::BI__builtin_neon_vceqzh_f16:
2429 *
this, builder, loc, ops[0],
2431 case NEON::BI__builtin_neon_vcgezd_s64:
2432 case NEON::BI__builtin_neon_vcgezd_f64:
2433 case NEON::BI__builtin_neon_vcgezs_f32:
2434 case NEON::BI__builtin_neon_vcgezh_f16:
2435 case NEON::BI__builtin_neon_vclezd_s64:
2436 case NEON::BI__builtin_neon_vclezd_f64:
2437 case NEON::BI__builtin_neon_vclezs_f32:
2438 case NEON::BI__builtin_neon_vclezh_f16:
2439 case NEON::BI__builtin_neon_vcgtzd_s64:
2440 case NEON::BI__builtin_neon_vcgtzd_f64:
2441 case NEON::BI__builtin_neon_vcgtzs_f32:
2442 case NEON::BI__builtin_neon_vcgtzh_f16:
2443 case NEON::BI__builtin_neon_vcltzd_s64:
2444 case NEON::BI__builtin_neon_vcltzd_f64:
2445 case NEON::BI__builtin_neon_vcltzs_f32:
2446 case NEON::BI__builtin_neon_vcltzh_f16:
2447 case NEON::BI__builtin_neon_vceqzd_u64: {
2449 *
this, builder, loc, ops[0],
2452 case NEON::BI__builtin_neon_vceqd_f64:
2453 case NEON::BI__builtin_neon_vcled_f64:
2454 case NEON::BI__builtin_neon_vcltd_f64:
2455 case NEON::BI__builtin_neon_vcged_f64:
2456 case NEON::BI__builtin_neon_vcgtd_f64:
2457 case NEON::BI__builtin_neon_vceqs_f32:
2458 case NEON::BI__builtin_neon_vcles_f32:
2459 case NEON::BI__builtin_neon_vclts_f32:
2460 case NEON::BI__builtin_neon_vcges_f32:
2461 case NEON::BI__builtin_neon_vcgts_f32:
2462 case NEON::BI__builtin_neon_vceqh_f16:
2463 case NEON::BI__builtin_neon_vcleh_f16:
2464 case NEON::BI__builtin_neon_vclth_f16:
2465 case NEON::BI__builtin_neon_vcgeh_f16:
2466 case NEON::BI__builtin_neon_vcgth_f16:
2467 case NEON::BI__builtin_neon_vceqd_s64:
2468 case NEON::BI__builtin_neon_vceqd_u64:
2469 case NEON::BI__builtin_neon_vcgtd_s64:
2470 case NEON::BI__builtin_neon_vcgtd_u64:
2471 case NEON::BI__builtin_neon_vcltd_s64:
2472 case NEON::BI__builtin_neon_vcltd_u64:
2473 case NEON::BI__builtin_neon_vcged_u64:
2474 case NEON::BI__builtin_neon_vcged_s64:
2475 case NEON::BI__builtin_neon_vcled_u64:
2476 case NEON::BI__builtin_neon_vcled_s64:
2477 cgm.errorNYI(
expr->getSourceRange(),
2478 std::string(
"unimplemented AArch64 builtin call: ") +
2479 getContext().BuiltinInfo.getName(builtinID));
2480 return mlir::Value{};
2481 case NEON::BI__builtin_neon_vnegd_s64: {
2482 return builder.createNeg(loc, ops[0]);
2484 case NEON::BI__builtin_neon_vnegh_f16: {
2485 return builder.createFNeg(loc, ops[0]);
2487 case NEON::BI__builtin_neon_vtstd_s64:
2488 case NEON::BI__builtin_neon_vtstd_u64:
2489 case NEON::BI__builtin_neon_vset_lane_i8:
2490 case NEON::BI__builtin_neon_vset_lane_i16:
2491 case NEON::BI__builtin_neon_vset_lane_i32:
2492 case NEON::BI__builtin_neon_vset_lane_i64:
2493 case NEON::BI__builtin_neon_vset_lane_bf16:
2494 case NEON::BI__builtin_neon_vset_lane_f32:
2495 case NEON::BI__builtin_neon_vsetq_lane_i8:
2496 case NEON::BI__builtin_neon_vsetq_lane_i16:
2497 case NEON::BI__builtin_neon_vsetq_lane_i32:
2498 case NEON::BI__builtin_neon_vsetq_lane_i64:
2499 case NEON::BI__builtin_neon_vsetq_lane_bf16:
2500 case NEON::BI__builtin_neon_vsetq_lane_f32:
2501 case NEON::BI__builtin_neon_vset_lane_f64:
2502 case NEON::BI__builtin_neon_vset_lane_mf8:
2503 case NEON::BI__builtin_neon_vsetq_lane_mf8:
2504 case NEON::BI__builtin_neon_vsetq_lane_f64:
2505 cgm.errorNYI(
expr->getSourceRange(),
2506 std::string(
"unimplemented AArch64 builtin call: ") +
2507 getContext().BuiltinInfo.getName(builtinID));
2508 return mlir::Value{};
2510 case NEON::BI__builtin_neon_vget_lane_i8:
2511 case NEON::BI__builtin_neon_vdupb_lane_i8:
2512 case NEON::BI__builtin_neon_vgetq_lane_i8:
2513 case NEON::BI__builtin_neon_vdupb_laneq_i8:
2514 case NEON::BI__builtin_neon_vget_lane_mf8:
2515 case NEON::BI__builtin_neon_vdupb_lane_mf8:
2516 case NEON::BI__builtin_neon_vgetq_lane_mf8:
2517 case NEON::BI__builtin_neon_vdupb_laneq_mf8:
2518 case NEON::BI__builtin_neon_vget_lane_i16:
2519 case NEON::BI__builtin_neon_vduph_lane_i16:
2520 case NEON::BI__builtin_neon_vgetq_lane_i16:
2521 case NEON::BI__builtin_neon_vduph_laneq_i16:
2522 case NEON::BI__builtin_neon_vget_lane_i32:
2523 case NEON::BI__builtin_neon_vdups_lane_i32:
2524 case NEON::BI__builtin_neon_vdups_lane_f32:
2525 case NEON::BI__builtin_neon_vgetq_lane_i32:
2526 case NEON::BI__builtin_neon_vdups_laneq_i32:
2527 case NEON::BI__builtin_neon_vget_lane_i64:
2528 case NEON::BI__builtin_neon_vdupd_lane_i64:
2529 case NEON::BI__builtin_neon_vdupd_lane_f64:
2530 case NEON::BI__builtin_neon_vgetq_lane_i64:
2531 case NEON::BI__builtin_neon_vdupd_laneq_i64:
2532 case NEON::BI__builtin_neon_vget_lane_f32:
2533 case NEON::BI__builtin_neon_vget_lane_f64:
2534 case NEON::BI__builtin_neon_vgetq_lane_f32:
2535 case NEON::BI__builtin_neon_vdups_laneq_f32:
2536 case NEON::BI__builtin_neon_vgetq_lane_f64:
2537 case NEON::BI__builtin_neon_vdupd_laneq_f64:
2538 return cir::VecExtractOp::create(builder, loc, ops[0],
2540 case NEON::BI__builtin_neon_vaddh_f16:
2541 return builder.createFAdd(loc, ops[0], ops[1]);
2542 case NEON::BI__builtin_neon_vsubh_f16:
2543 return builder.createFSub(loc, ops[0], ops[1]);
2544 case NEON::BI__builtin_neon_vmulh_f16:
2545 return builder.createFMul(loc, ops[0], ops[1]);
2546 case NEON::BI__builtin_neon_vdivh_f16:
2547 return builder.createFDiv(loc, ops[0], ops[1]);
2548 case NEON::BI__builtin_neon_vfmah_f16:
2550 std::rotate(ops.begin(), ops.begin() + 1, ops.end());
2554 case NEON::BI__builtin_neon_vfmsh_f16:
2556 std::rotate(ops.begin(), ops.begin() + 1, ops.end());
2557 ops[0] = builder.createFNeg(loc, ops[0]);
2560 case NEON::BI__builtin_neon_vaddd_s64:
2561 case NEON::BI__builtin_neon_vaddd_u64:
2562 return builder.createAdd(loc, ops[0], ops[1]);
2563 case NEON::BI__builtin_neon_vsubd_s64:
2564 case NEON::BI__builtin_neon_vsubd_u64:
2565 case NEON::BI__builtin_neon_vqdmlalh_s16:
2566 case NEON::BI__builtin_neon_vqdmlslh_s16:
2567 cgm.errorNYI(
expr->getSourceRange(),
2568 std::string(
"unimplemented AArch64 builtin call: ") +
2569 getContext().BuiltinInfo.getName(builtinID));
2570 return mlir::Value{};
2571 case NEON::BI__builtin_neon_vqshlud_n_s64: {
2572 cir::IntType int64Type = builder.getSInt64Ty();
2578 case NEON::BI__builtin_neon_vqshld_n_u64:
2579 case NEON::BI__builtin_neon_vqshld_n_s64: {
2580 cir::IntType int64Type = builtinID == NEON::BI__builtin_neon_vqshld_n_u64
2581 ? builder.getUInt64Ty()
2582 : builder.getSInt64Ty();
2583 llvm::StringRef intrinsicName =
2584 builtinID == NEON::BI__builtin_neon_vqshld_n_u64 ?
"aarch64.neon.uqshl"
2585 :
"aarch64.neon.sqshl";
2590 case NEON::BI__builtin_neon_vrshrd_n_u64:
2591 case NEON::BI__builtin_neon_vrshrd_n_s64: {
2592 llvm::StringRef intrName = builtinID == NEON::BI__builtin_neon_vrshrd_n_s64
2593 ?
"aarch64.neon.srshl"
2594 :
"aarch64.neon.urshl";
2595 cir::IntType int64Ty = builtinID == NEON::BI__builtin_neon_vqshld_n_u64
2596 ? builder.getUInt64Ty()
2597 : builder.getSInt64Ty();
2601 ops[1] = builder.getSInt64(sv, loc);
2602 return emitNeonCall(
cgm, builder, {int64Ty, builder.getSInt64Ty()}, ops,
2603 intrName, int64Ty, loc);
2605 case NEON::BI__builtin_neon_vrsrad_n_u64:
2606 case NEON::BI__builtin_neon_vrsrad_n_s64: {
2607 cir::IntType int64Type = builtinID == NEON::BI__builtin_neon_vrsrad_n_u64
2608 ? builder.getUInt64Ty()
2609 : builder.getSInt64Ty();
2610 ops[2] = builder.createNeg(loc, ops[2]);
2611 const StringRef intrName = builtinID == NEON::BI__builtin_neon_vrsrad_n_u64
2612 ?
"aarch64.neon.urshl"
2613 :
"aarch64.neon.srshl";
2616 ops[1], builder.createIntCast(ops[2], builder.getSInt64Ty())};
2617 ops[1] = builder.emitIntrinsicCallOp(loc, intrName, int64Type, args);
2618 return builder.createAdd(loc, ops[0],
2619 builder.createBitcast(ops[1], int64Type));
2621 case NEON::BI__builtin_neon_vshld_n_s64:
2622 case NEON::BI__builtin_neon_vshld_n_u64: {
2624 std::optional<llvm::APSInt> amt =
2626 assert(amt &&
"Expected argument to be a constant");
2627 return builder.createShiftLeft(loc, ops[0], amt->getZExtValue());
2629 case NEON::BI__builtin_neon_vshrd_n_s64: {
2630 std::optional<llvm::APSInt> amt =
2632 assert(amt &&
"Expected argument to be a constant");
2633 return builder.createShiftRight(
2634 loc, ops[0], std::min(
static_cast<uint64_t
>(63), amt->getZExtValue()));
2636 case NEON::BI__builtin_neon_vshrd_n_u64: {
2637 std::optional<llvm::APSInt> amt =
2639 assert(amt &&
"Expected argument to be a constant");
2640 uint64_t shiftAmt = amt->getZExtValue();
2643 return builder.getConstInt(loc, builder.getUInt64Ty(), 0);
2644 return builder.createShiftRight(loc, ops[0], shiftAmt);
2646 case NEON::BI__builtin_neon_vsrad_n_s64: {
2647 std::optional<llvm::APSInt> amt =
2649 assert(amt &&
"Expected argument to be a constant");
2651 std::min(
static_cast<uint64_t
>(63), amt->getZExtValue());
2652 mlir::Value shifted =
2653 builder.createShiftRight(loc, ops[1],
static_cast<unsigned>(shiftAmt));
2654 return builder.createAdd(loc, ops[0], shifted);
2656 case NEON::BI__builtin_neon_vsrad_n_u64: {
2657 std::optional<llvm::APSInt> amt =
2659 assert(amt &&
"Expected argument to be a constant");
2660 uint64_t shiftAmt = amt->getZExtValue();
2664 mlir::Value shifted =
2665 builder.createShiftRight(loc, ops[1],
static_cast<unsigned>(shiftAmt));
2666 return builder.createAdd(loc, ops[0], shifted);
2668 case NEON::BI__builtin_neon_vqdmlalh_lane_s16:
2669 case NEON::BI__builtin_neon_vqdmlalh_laneq_s16:
2670 case NEON::BI__builtin_neon_vqdmlslh_lane_s16:
2671 case NEON::BI__builtin_neon_vqdmlslh_laneq_s16:
2672 case NEON::BI__builtin_neon_vqdmlals_s32:
2673 case NEON::BI__builtin_neon_vqdmlsls_s32:
2674 case NEON::BI__builtin_neon_vqdmlals_lane_s32:
2675 case NEON::BI__builtin_neon_vqdmlals_laneq_s32:
2676 case NEON::BI__builtin_neon_vqdmlsls_lane_s32:
2677 case NEON::BI__builtin_neon_vqdmlsls_laneq_s32: {
2678 cgm.errorNYI(
expr->getSourceRange(),
2679 std::string(
"unimplemented AArch64 builtin call: ") +
2680 getContext().BuiltinInfo.getName(builtinID));
2681 return mlir::Value{};
2683 case NEON::BI__builtin_neon_vget_lane_bf16:
2684 case NEON::BI__builtin_neon_vduph_lane_bf16:
2685 case NEON::BI__builtin_neon_vduph_lane_f16:
2686 case NEON::BI__builtin_neon_vgetq_lane_bf16:
2687 case NEON::BI__builtin_neon_vduph_laneq_bf16:
2688 case NEON::BI__builtin_neon_vduph_laneq_f16: {
2689 return cir::VecExtractOp::create(builder, loc, ops[0], ops[1]);
2691 case NEON::BI__builtin_neon_vcvt_bf16_f32:
2692 case NEON::BI__builtin_neon_vcvtq_low_bf16_f32:
2693 case NEON::BI__builtin_neon_vcvtq_high_bf16_f32:
2694 case clang::AArch64::BI_InterlockedAdd:
2695 case clang::AArch64::BI_InterlockedAdd_acq:
2696 case clang::AArch64::BI_InterlockedAdd_rel:
2697 case clang::AArch64::BI_InterlockedAdd_nf:
2698 case clang::AArch64::BI_InterlockedAdd64:
2699 case clang::AArch64::BI_InterlockedAdd64_acq:
2700 case clang::AArch64::BI_InterlockedAdd64_rel:
2701 case clang::AArch64::BI_InterlockedAdd64_nf:
2702 cgm.errorNYI(
expr->getSourceRange(),
2703 std::string(
"unimplemented AArch64 builtin call: ") +
2704 getContext().BuiltinInfo.getName(builtinID));
2705 return mlir::Value{};
2712 llvm::StringRef intrName;
2714 switch (builtinID) {
2716 return std::nullopt;
2717 case NEON::BI__builtin_neon_vbsl_v:
2718 case NEON::BI__builtin_neon_vbslq_v: {
2721 ops[0] = builder.createBitcast(ops[0], bitTy);
2722 ops[1] = builder.createBitcast(ops[1], bitTy);
2723 ops[2] = builder.createBitcast(ops[2], bitTy);
2725 ops[1] = builder.createAnd(loc, ops[0], ops[1]);
2726 ops[2] = builder.createAnd(loc, builder.createNot(ops[0]), ops[2]);
2727 ops[0] = builder.createOr(loc, ops[1], ops[2]);
2728 return builder.createBitcast(ops[0], ty);
2730 case NEON::BI__builtin_neon_vfma_lane_v:
2731 cgm.errorNYI(
expr->getSourceRange(),
2732 std::string(
"unimplemented AArch64 builtin call: ") +
2733 getContext().BuiltinInfo.getName(builtinID));
2734 return mlir::Value{};
2735 case NEON::BI__builtin_neon_vfmaq_lane_v: {
2736 mlir::Value addend = builder.createBitcast(ops[0], ty);
2737 mlir::Value multiplicand = builder.createBitcast(ops[1], ty);
2740 cir::VectorType sourceTy =
2741 cir::VectorType::get(ty.getElementType(), ty.getSize() / 2);
2742 mlir::Value laneSource = builder.createBitcast(ops[2], sourceTy);
2743 laneSource =
emitNeonSplat(builder, loc, laneSource, ops[3], ty.getSize());
2748 case NEON::BI__builtin_neon_vfma_laneq_v: {
2750 if (ty.getElementType() ==
cgm.doubleTy) {
2751 mlir::Value addend = builder.createBitcast(ops[0],
cgm.doubleTy);
2752 mlir::Value multiplicand = builder.createBitcast(ops[1],
cgm.doubleTy);
2755 cir::VectorType sourceTy = cir::VectorType::get(
cgm.doubleTy, 2);
2756 mlir::Value laneSource = builder.createBitcast(ops[2], sourceTy);
2757 laneSource = builder.createExtractElement(
2763 return builder.createBitcast(
2769 mlir::Value addend = builder.createBitcast(ops[0], ty);
2770 mlir::Value multiplicand = builder.createBitcast(ops[1], ty);
2773 cir::VectorType sourceTy =
2774 cir::VectorType::get(ty.getElementType(), ty.getSize() * 2);
2775 mlir::Value laneSource = builder.createBitcast(ops[2], sourceTy);
2776 laneSource =
emitNeonSplat(builder, loc, laneSource, ops[3], ty.getSize());
2781 case NEON::BI__builtin_neon_vfmaq_laneq_v:
2782 case NEON::BI__builtin_neon_vfmah_lane_f16:
2783 case NEON::BI__builtin_neon_vfmas_lane_f32:
2784 case NEON::BI__builtin_neon_vfmah_laneq_f16:
2785 case NEON::BI__builtin_neon_vfmas_laneq_f32:
2786 case NEON::BI__builtin_neon_vfmad_lane_f64:
2787 case NEON::BI__builtin_neon_vfmad_laneq_f64:
2788 cgm.errorNYI(
expr->getSourceRange(),
2789 std::string(
"unimplemented AArch64 builtin call: ") +
2790 getContext().BuiltinInfo.getName(builtinID));
2791 return mlir::Value{};
2792 case NEON::BI__builtin_neon_vmull_v: {
2793 intrName = usgn ?
"aarch64.neon.umull" :
"aarch64.neon.smull";
2795 intrName =
"aarch64.neon.pmull";
2796 cir::VectorType argTy = builder.getExtendedOrTruncatedElementVectorType(
2798 return emitNeonCall(
cgm, builder, {argTy, argTy}, ops, intrName, ty, loc);
2800 case NEON::BI__builtin_neon_vmax_v:
2801 case NEON::BI__builtin_neon_vmaxq_v:
2802 intrName = usgn ?
"aarch64.neon.umax" :
"aarch64.neon.smax";
2803 if (cir::isFPOrVectorOfFPType(ty))
2804 intrName =
"aarch64.neon.fmax";
2806 case NEON::BI__builtin_neon_vmaxh_f16:
2807 cgm.errorNYI(
expr->getSourceRange(),
2808 std::string(
"unimplemented AArch64 builtin call: ") +
2809 getContext().BuiltinInfo.getName(builtinID));
2810 return mlir::Value{};
2811 case NEON::BI__builtin_neon_vmin_v:
2812 case NEON::BI__builtin_neon_vminq_v:
2813 intrName = usgn ?
"aarch64.neon.umin" :
"aarch64.neon.smin";
2814 if (cir::isFPOrVectorOfFPType(ty))
2815 intrName =
"aarch64.neon.fmin";
2817 case NEON::BI__builtin_neon_vminh_f16:
2818 cgm.errorNYI(
expr->getSourceRange(),
2819 std::string(
"unimplemented AArch64 builtin call: ") +
2820 getContext().BuiltinInfo.getName(builtinID));
2821 return mlir::Value{};
2822 case NEON::BI__builtin_neon_vabd_v:
2823 case NEON::BI__builtin_neon_vabdq_v:
2824 intrName = usgn ?
"aarch64.neon.uabd" :
"aarch64.neon.sabd";
2825 if (cir::isFPOrVectorOfFPType(ty))
2826 intrName =
"aarch64.neon.fabd";
2828 case NEON::BI__builtin_neon_vpadal_v:
2829 case NEON::BI__builtin_neon_vpadalq_v: {
2830 intrName = usgn ?
"aarch64.neon.uaddlp" :
"aarch64.neon.saddlp";
2832 mlir::Value pairwiseSum =
2834 inputs, intrName, ty, loc);
2835 mlir::Value accumValue = builder.createBitcast(loc, ops[0], ty);
2836 return cir::AddOp::create(builder, loc, ty, pairwiseSum, accumValue);
2838 case NEON::BI__builtin_neon_vpmin_v:
2839 case NEON::BI__builtin_neon_vpminq_v:
2840 intrName = usgn ?
"aarch64.neon.uminp" :
"aarch64.neon.sminp";
2841 if (cir::isFPOrVectorOfFPType(ty))
2842 intrName =
"aarch64.neon.fminp";
2844 case NEON::BI__builtin_neon_vpmax_v:
2845 case NEON::BI__builtin_neon_vpmaxq_v:
2846 intrName = usgn ?
"aarch64.neon.umaxp" :
"aarch64.neon.smaxp";
2847 if (cir::isFPOrVectorOfFPType(ty))
2848 intrName =
"aarch64.neon.fmaxp";
2850 case NEON::BI__builtin_neon_vminnm_v:
2851 case NEON::BI__builtin_neon_vminnmq_v:
2852 intrName =
"aarch64.neon.fminnm";
2854 case NEON::BI__builtin_neon_vminnmh_f16:
2855 cgm.errorNYI(
expr->getSourceRange(),
2856 std::string(
"unimplemented AArch64 builtin call: ") +
2857 getContext().BuiltinInfo.getName(builtinID));
2858 return mlir::Value{};
2859 case NEON::BI__builtin_neon_vmaxnm_v:
2860 case NEON::BI__builtin_neon_vmaxnmq_v:
2861 intrName =
"aarch64.neon.fmaxnm";
2863 case NEON::BI__builtin_neon_vmaxnmh_f16:
2864 case NEON::BI__builtin_neon_vrecpss_f32:
2865 case NEON::BI__builtin_neon_vrecpsd_f64:
2866 case NEON::BI__builtin_neon_vrecpsh_f16:
2867 case NEON::BI__builtin_neon_vqshrun_n_v:
2868 cgm.errorNYI(
expr->getSourceRange(),
2869 std::string(
"unimplemented AArch64 builtin call: ") +
2870 getContext().BuiltinInfo.getName(builtinID));
2871 return mlir::Value{};
2872 case NEON::BI__builtin_neon_vqrshrun_n_v: {
2873 cir::VectorType argTy = builder.getExtendedOrTruncatedElementVectorType(
2876 "aarch64.neon.sqrshrun", ty, loc);
2878 case NEON::BI__builtin_neon_vqshrn_n_v:
2879 cgm.errorNYI(
expr->getSourceRange(),
2880 std::string(
"unimplemented AArch64 builtin call: ") +
2881 getContext().BuiltinInfo.getName(builtinID));
2882 return mlir::Value{};
2883 case NEON::BI__builtin_neon_vrshrn_n_v:
2884 cgm.errorNYI(
expr->getSourceRange(),
2885 std::string(
"unimplemented AArch64 builtin call: ") +
2886 getContext().BuiltinInfo.getName(builtinID));
2887 return mlir::Value{};
2888 case NEON::BI__builtin_neon_vqrshrn_n_v: {
2889 cir::VectorType argTy = builder.getExtendedOrTruncatedElementVectorType(
2891 llvm::StringRef intrName =
2892 usgn ?
"aarch64.neon.uqrshrn" :
"aarch64.neon.sqrshrn";
2896 case NEON::BI__builtin_neon_vrndah_f16:
2897 case NEON::BI__builtin_neon_vrnda_v:
2898 case NEON::BI__builtin_neon_vrndaq_v:
2899 case NEON::BI__builtin_neon_vrndih_f16:
2900 case NEON::BI__builtin_neon_vrndmh_f16:
2901 case NEON::BI__builtin_neon_vrndm_v:
2902 case NEON::BI__builtin_neon_vrndmq_v:
2903 case NEON::BI__builtin_neon_vrndnh_f16:
2904 case NEON::BI__builtin_neon_vrndn_v:
2905 case NEON::BI__builtin_neon_vrndnq_v:
2906 case NEON::BI__builtin_neon_vrndns_f32:
2907 case NEON::BI__builtin_neon_vrndph_f16:
2908 case NEON::BI__builtin_neon_vrndp_v:
2909 case NEON::BI__builtin_neon_vrndpq_v:
2910 case NEON::BI__builtin_neon_vrndxh_f16:
2911 case NEON::BI__builtin_neon_vrndx_v:
2912 case NEON::BI__builtin_neon_vrndxq_v:
2913 case NEON::BI__builtin_neon_vrndh_f16:
2914 case NEON::BI__builtin_neon_vrnd32x_f32:
2915 case NEON::BI__builtin_neon_vrnd32xq_f32:
2916 case NEON::BI__builtin_neon_vrnd32x_f64:
2917 case NEON::BI__builtin_neon_vrnd32xq_f64:
2918 case NEON::BI__builtin_neon_vrnd32z_f32:
2919 case NEON::BI__builtin_neon_vrnd32zq_f32:
2920 case NEON::BI__builtin_neon_vrnd32z_f64:
2921 case NEON::BI__builtin_neon_vrnd32zq_f64:
2922 case NEON::BI__builtin_neon_vrnd64x_f32:
2923 case NEON::BI__builtin_neon_vrnd64xq_f32:
2924 case NEON::BI__builtin_neon_vrnd64x_f64:
2925 case NEON::BI__builtin_neon_vrnd64xq_f64:
2926 case NEON::BI__builtin_neon_vrnd64z_f32:
2927 case NEON::BI__builtin_neon_vrnd64zq_f32:
2928 case NEON::BI__builtin_neon_vrnd64z_f64:
2929 case NEON::BI__builtin_neon_vrnd64zq_f64:
2930 case NEON::BI__builtin_neon_vrnd_v:
2931 case NEON::BI__builtin_neon_vrndq_v:
2932 cgm.errorNYI(
expr->getSourceRange(),
2933 std::string(
"unimplemented AArch64 builtin call: ") +
2934 getContext().BuiltinInfo.getName(builtinID));
2935 return mlir::Value{};
2936 case NEON::BI__builtin_neon_vcvt_f64_v:
2937 case NEON::BI__builtin_neon_vcvtq_f64_v:
2938 ops[0] = builder.createBitcast(ops[0], ty);
2941 return builder.createCast(loc, cir::CastKind::int_to_float, ops[0], ty);
2942 case NEON::BI__builtin_neon_vcvt_f64_f32:
2943 case NEON::BI__builtin_neon_vcvt_f32_f64:
2944 case NEON::BI__builtin_neon_vcvt_s32_v:
2945 case NEON::BI__builtin_neon_vcvt_u32_v:
2946 case NEON::BI__builtin_neon_vcvt_s64_v:
2947 case NEON::BI__builtin_neon_vcvt_u64_v:
2948 case NEON::BI__builtin_neon_vcvt_s16_f16:
2949 case NEON::BI__builtin_neon_vcvt_u16_f16:
2950 case NEON::BI__builtin_neon_vcvtq_s32_v:
2951 case NEON::BI__builtin_neon_vcvtq_u32_v:
2952 case NEON::BI__builtin_neon_vcvtq_s64_v:
2953 case NEON::BI__builtin_neon_vcvtq_u64_v:
2954 case NEON::BI__builtin_neon_vcvtq_s16_f16:
2955 case NEON::BI__builtin_neon_vcvtq_u16_f16:
2956 case NEON::BI__builtin_neon_vcvta_s16_f16:
2957 case NEON::BI__builtin_neon_vcvta_u16_f16:
2958 case NEON::BI__builtin_neon_vcvta_s32_v:
2959 case NEON::BI__builtin_neon_vcvtaq_s16_f16:
2960 case NEON::BI__builtin_neon_vcvtaq_s32_v:
2961 case NEON::BI__builtin_neon_vcvta_u32_v:
2962 case NEON::BI__builtin_neon_vcvtaq_u16_f16:
2963 case NEON::BI__builtin_neon_vcvtaq_u32_v:
2964 case NEON::BI__builtin_neon_vcvta_s64_v:
2965 case NEON::BI__builtin_neon_vcvtaq_s64_v:
2966 case NEON::BI__builtin_neon_vcvta_u64_v:
2967 case NEON::BI__builtin_neon_vcvtaq_u64_v:
2968 case NEON::BI__builtin_neon_vcvtm_s16_f16:
2969 case NEON::BI__builtin_neon_vcvtm_s32_v:
2970 case NEON::BI__builtin_neon_vcvtmq_s16_f16:
2971 case NEON::BI__builtin_neon_vcvtmq_s32_v:
2972 case NEON::BI__builtin_neon_vcvtm_u16_f16:
2973 case NEON::BI__builtin_neon_vcvtm_u32_v:
2974 case NEON::BI__builtin_neon_vcvtmq_u16_f16:
2975 case NEON::BI__builtin_neon_vcvtmq_u32_v:
2976 case NEON::BI__builtin_neon_vcvtm_s64_v:
2977 case NEON::BI__builtin_neon_vcvtmq_s64_v:
2978 case NEON::BI__builtin_neon_vcvtm_u64_v:
2979 case NEON::BI__builtin_neon_vcvtmq_u64_v:
2980 case NEON::BI__builtin_neon_vcvtn_s16_f16:
2981 case NEON::BI__builtin_neon_vcvtn_s32_v:
2982 case NEON::BI__builtin_neon_vcvtnq_s16_f16:
2983 case NEON::BI__builtin_neon_vcvtnq_s32_v:
2984 case NEON::BI__builtin_neon_vcvtn_u16_f16:
2985 case NEON::BI__builtin_neon_vcvtn_u32_v:
2986 case NEON::BI__builtin_neon_vcvtnq_u16_f16:
2987 case NEON::BI__builtin_neon_vcvtnq_u32_v:
2988 case NEON::BI__builtin_neon_vcvtn_s64_v:
2989 case NEON::BI__builtin_neon_vcvtnq_s64_v:
2990 case NEON::BI__builtin_neon_vcvtn_u64_v:
2991 case NEON::BI__builtin_neon_vcvtnq_u64_v:
2992 case NEON::BI__builtin_neon_vcvtp_s16_f16:
2993 case NEON::BI__builtin_neon_vcvtp_s32_v:
2994 case NEON::BI__builtin_neon_vcvtpq_s16_f16:
2995 case NEON::BI__builtin_neon_vcvtpq_s32_v:
2996 case NEON::BI__builtin_neon_vcvtp_u16_f16:
2997 case NEON::BI__builtin_neon_vcvtp_u32_v:
2998 case NEON::BI__builtin_neon_vcvtpq_u16_f16:
2999 case NEON::BI__builtin_neon_vcvtpq_u32_v:
3000 case NEON::BI__builtin_neon_vcvtp_s64_v:
3001 case NEON::BI__builtin_neon_vcvtpq_s64_v:
3002 case NEON::BI__builtin_neon_vcvtp_u64_v:
3003 case NEON::BI__builtin_neon_vcvtpq_u64_v:
3004 case NEON::BI__builtin_neon_vmulx_v:
3005 case NEON::BI__builtin_neon_vmulxq_v:
3006 case NEON::BI__builtin_neon_vmulxh_lane_f16:
3007 case NEON::BI__builtin_neon_vmulxh_laneq_f16:
3008 case NEON::BI__builtin_neon_vmul_lane_v:
3009 case NEON::BI__builtin_neon_vmul_laneq_v:
3010 case NEON::BI__builtin_neon_vpmaxnm_v:
3011 case NEON::BI__builtin_neon_vpmaxnmq_v:
3012 cgm.errorNYI(
expr->getSourceRange(),
3013 std::string(
"unimplemented AArch64 builtin call: ") +
3014 getContext().BuiltinInfo.getName(builtinID));
3015 return mlir::Value{};
3016 case NEON::BI__builtin_neon_vpminnm_v:
3017 case NEON::BI__builtin_neon_vpminnmq_v:
3018 intrName =
"aarch64.neon.fminnmp";
3020 case NEON::BI__builtin_neon_vsqrth_f16:
3021 cgm.errorNYI(
expr->getSourceRange(),
3022 std::string(
"unimplemented AArch64 builtin call: ") +
3023 getContext().BuiltinInfo.getName(builtinID));
3024 return mlir::Value{};
3025 case NEON::BI__builtin_neon_vsqrt_v:
3026 case NEON::BI__builtin_neon_vsqrtq_v:
3029 case NEON::BI__builtin_neon_vrbit_v:
3030 case NEON::BI__builtin_neon_vrbitq_v:
3031 case NEON::BI__builtin_neon_vmaxv_f16:
3032 case NEON::BI__builtin_neon_vmaxvq_f16:
3033 case NEON::BI__builtin_neon_vminv_f16:
3034 case NEON::BI__builtin_neon_vminvq_f16:
3035 case NEON::BI__builtin_neon_vmaxnmv_f16:
3036 case NEON::BI__builtin_neon_vmaxnmvq_f16:
3037 case NEON::BI__builtin_neon_vminnmv_f16:
3038 case NEON::BI__builtin_neon_vminnmvq_f16:
3039 case NEON::BI__builtin_neon_vmul_n_f64:
3040 cgm.errorNYI(
expr->getSourceRange(),
3041 std::string(
"unimplemented AArch64 builtin call: ") +
3042 getContext().BuiltinInfo.getName(builtinID));
3043 return mlir::Value{};
3044 case NEON::BI__builtin_neon_vaddlv_u8:
3045 case NEON::BI__builtin_neon_vaddlvq_u8:
3046 case NEON::BI__builtin_neon_vaddlv_u16:
3047 case NEON::BI__builtin_neon_vaddlvq_u16:
3048 case NEON::BI__builtin_neon_vaddlv_s8:
3049 case NEON::BI__builtin_neon_vaddlvq_s8:
3050 case NEON::BI__builtin_neon_vaddlv_s16:
3051 case NEON::BI__builtin_neon_vaddlvq_s16: {
3054 auto eltTy = mlir::cast<cir::IntType>(
3055 mlir::cast<cir::VectorType>(argTy).getElementType());
3060 bool needsTrunc = eltTy.getWidth() == 8;
3061 intrName =
isUnsigned ?
"aarch64.neon.uaddlv" :
"aarch64.neon.saddlv";
3062 mlir::Type intrRetTy = userRetTy;
3064 intrRetTy =
isUnsigned ? builder.getUInt32Ty() : builder.getSInt32Ty();
3065 mlir::Value result =
3068 result = builder.createIntCast(result, userRetTy);
3071 case NEON::BI__builtin_neon_vsri_n_v:
3072 case NEON::BI__builtin_neon_vsriq_n_v: {
3074 ops[0], ops[1], builder.createIntCast(ops[2], builder.getUInt32Ty())};
3075 return emitNeonCall(
cgm, builder, {ty, ty, builder.getUInt32Ty()}, vsriArgs,
3076 "aarch64.neon.vsri", ty, loc);
3078 case NEON::BI__builtin_neon_vsli_n_v:
3079 case NEON::BI__builtin_neon_vsliq_n_v: {
3081 intrName =
"aarch64.neon.vsli";
3089 case NEON::BI__builtin_neon_vsra_n_v:
3090 case NEON::BI__builtin_neon_vsraq_n_v: {
3091 ops[0] = builder.createBitcast(ops[0], ty);
3093 return builder.createAdd(loc, ops[0], ops[1]);
3095 case NEON::BI__builtin_neon_vrsra_n_v:
3096 case NEON::BI__builtin_neon_vrsraq_n_v: {
3097 intrName = usgn ?
"aarch64.neon.urshl" :
"aarch64.neon.srshl";
3100 cir::VectorType shiftAmtVecTy =
3103 mlir::Value tmp =
emitNeonCall(
cgm, builder, {ty, shiftAmtVecTy}, tmpOps,
3107 ops[0] = builder.createBitcast(ops[0], ty);
3108 return builder.createAdd(loc, ops[0], tmp);
3110 case NEON::BI__builtin_neon_vld1_v:
3111 case NEON::BI__builtin_neon_vld1q_v:
3112 case NEON::BI__builtin_neon_vst1_v:
3113 case NEON::BI__builtin_neon_vst1q_v:
3114 case NEON::BI__builtin_neon_vld1_lane_v:
3115 case NEON::BI__builtin_neon_vld1q_lane_v:
3116 case NEON::BI__builtin_neon_vldap1_lane_s64:
3117 case NEON::BI__builtin_neon_vldap1q_lane_s64:
3118 case NEON::BI__builtin_neon_vld1_dup_v:
3119 case NEON::BI__builtin_neon_vld1q_dup_v:
3120 case NEON::BI__builtin_neon_vst1_lane_v:
3121 case NEON::BI__builtin_neon_vst1q_lane_v:
3122 case NEON::BI__builtin_neon_vstl1_lane_s64:
3123 case NEON::BI__builtin_neon_vstl1q_lane_s64:
3124 case NEON::BI__builtin_neon_vld2_v:
3125 case NEON::BI__builtin_neon_vld2q_v:
3126 case NEON::BI__builtin_neon_vld3_v:
3127 case NEON::BI__builtin_neon_vld3q_v:
3128 case NEON::BI__builtin_neon_vld4_v:
3129 case NEON::BI__builtin_neon_vld4q_v:
3130 case NEON::BI__builtin_neon_vld2_dup_v:
3131 case NEON::BI__builtin_neon_vld2q_dup_v:
3132 case NEON::BI__builtin_neon_vld3_dup_v:
3133 case NEON::BI__builtin_neon_vld3q_dup_v:
3134 case NEON::BI__builtin_neon_vld4_dup_v:
3135 case NEON::BI__builtin_neon_vld4q_dup_v:
3136 case NEON::BI__builtin_neon_vld2_lane_v:
3137 case NEON::BI__builtin_neon_vld2q_lane_v:
3138 case NEON::BI__builtin_neon_vld3_lane_v:
3139 case NEON::BI__builtin_neon_vld3q_lane_v:
3140 case NEON::BI__builtin_neon_vld4_lane_v:
3141 case NEON::BI__builtin_neon_vld4q_lane_v:
3142 case NEON::BI__builtin_neon_vst2_v:
3143 case NEON::BI__builtin_neon_vst2q_v:
3144 case NEON::BI__builtin_neon_vst2_lane_v:
3145 case NEON::BI__builtin_neon_vst2q_lane_v:
3146 case NEON::BI__builtin_neon_vst3_v:
3147 case NEON::BI__builtin_neon_vst3q_v:
3148 case NEON::BI__builtin_neon_vst3_lane_v:
3149 case NEON::BI__builtin_neon_vst3q_lane_v:
3150 case NEON::BI__builtin_neon_vst4_v:
3151 case NEON::BI__builtin_neon_vst4q_v:
3152 case NEON::BI__builtin_neon_vst4_lane_v:
3153 case NEON::BI__builtin_neon_vst4q_lane_v:
3154 cgm.errorNYI(
expr->getSourceRange(),
3155 std::string(
"unimplemented AArch64 builtin call: ") +
3156 getContext().BuiltinInfo.getName(builtinID));
3157 return mlir::Value{};
3158 case NEON::BI__builtin_neon_vtrn_v:
3159 case NEON::BI__builtin_neon_vtrnq_v: {
3160 ops[1] = builder.createBitcast(ops[1], ty);
3161 ops[2] = builder.createBitcast(ops[2], ty);
3163 mlir::Value baseAddr =
3164 builder.createBitcast(ops[0], builder.getPointerTo(ty));
3167 for (
unsigned vi = 0; vi != 2; ++vi) {
3169 for (
unsigned i = 0, e = ty.getSize(); i != e; i += 2) {
3170 indices.push_back(i + vi);
3171 indices.push_back(i + e + vi);
3173 cir::ConstantOp idx = builder.getConstInt(loc, builder.getSInt32Ty(), vi);
3174 mlir::Value addr = builder.createPtrStride(loc, baseAddr, idx);
3175 sv = builder.createVecShuffle(loc, ops[1], ops[2], indices);
3176 (void)builder.CIRBaseBuilderTy::createStore(loc, sv, addr);
3180 case NEON::BI__builtin_neon_vuzp_v:
3181 case NEON::BI__builtin_neon_vuzpq_v: {
3182 ops[1] = builder.createBitcast(ops[1], ty);
3183 ops[2] = builder.createBitcast(ops[2], ty);
3185 mlir::Value baseAddr =
3186 builder.createBitcast(ops[0], builder.getPointerTo(ty));
3188 for (
unsigned vi = 0; vi != 2; ++vi) {
3190 for (
unsigned i = 0, e = ty.getSize(); i != e; ++i) {
3191 indices.push_back(2 * i + vi);
3193 cir::ConstantOp idx = builder.getConstInt(loc, builder.getSInt32Ty(), vi);
3194 mlir::Value addr = builder.createPtrStride(loc, baseAddr, idx);
3195 sv = builder.createVecShuffle(loc, ops[1], ops[2], indices);
3196 (void)builder.CIRBaseBuilderTy::createStore(loc, sv, addr);
3200 case NEON::BI__builtin_neon_vzip_v:
3201 case NEON::BI__builtin_neon_vzipq_v: {
3202 ops[1] = builder.createBitcast(ops[1], ty);
3203 ops[2] = builder.createBitcast(ops[2], ty);
3205 mlir::Value baseAddr =
3206 builder.createBitcast(ops[0], builder.getPointerTo(ty));
3208 for (
unsigned vi = 0; vi != 2; ++vi) {
3210 for (
unsigned i = 0, e = ty.getSize(); i != e; i += 2) {
3211 indices.push_back((i + vi * e) >> 1);
3212 indices.push_back(((i + vi * e) >> 1) + e);
3214 cir::ConstantOp idx = builder.getConstInt(loc, builder.getSInt32Ty(), vi);
3215 mlir::Value addr = builder.createPtrStride(loc, baseAddr, idx);
3216 sv = builder.createVecShuffle(loc, ops[1], ops[2], indices);
3217 (void)builder.CIRBaseBuilderTy::createStore(loc, sv, addr);
3221 case NEON::BI__builtin_neon_vqtbl1q_v:
3222 case NEON::BI__builtin_neon_vqtbl2q_v:
3223 case NEON::BI__builtin_neon_vqtbl3q_v:
3224 case NEON::BI__builtin_neon_vqtbl4q_v:
3225 case NEON::BI__builtin_neon_vqtbx1q_v:
3226 case NEON::BI__builtin_neon_vqtbx2q_v:
3227 case NEON::BI__builtin_neon_vqtbx3q_v:
3228 case NEON::BI__builtin_neon_vqtbx4q_v:
3229 case NEON::BI__builtin_neon_vsqadd_v:
3230 case NEON::BI__builtin_neon_vsqaddq_v:
3231 case NEON::BI__builtin_neon_vuqadd_v:
3232 case NEON::BI__builtin_neon_vuqaddq_v:
3233 case NEON::BI__builtin_neon_vluti2_laneq_mf8:
3234 case NEON::BI__builtin_neon_vluti2_laneq_bf16:
3235 case NEON::BI__builtin_neon_vluti2_laneq_f16:
3236 case NEON::BI__builtin_neon_vluti2_laneq_p16:
3237 case NEON::BI__builtin_neon_vluti2_laneq_p8:
3238 case NEON::BI__builtin_neon_vluti2_laneq_s16:
3239 case NEON::BI__builtin_neon_vluti2_laneq_s8:
3240 case NEON::BI__builtin_neon_vluti2_laneq_u16:
3241 case NEON::BI__builtin_neon_vluti2_laneq_u8:
3242 case NEON::BI__builtin_neon_vluti2q_laneq_mf8:
3243 case NEON::BI__builtin_neon_vluti2q_laneq_bf16:
3244 case NEON::BI__builtin_neon_vluti2q_laneq_f16:
3245 case NEON::BI__builtin_neon_vluti2q_laneq_p16:
3246 case NEON::BI__builtin_neon_vluti2q_laneq_p8:
3247 case NEON::BI__builtin_neon_vluti2q_laneq_s16:
3248 case NEON::BI__builtin_neon_vluti2q_laneq_s8:
3249 case NEON::BI__builtin_neon_vluti2q_laneq_u16:
3250 case NEON::BI__builtin_neon_vluti2q_laneq_u8:
3251 case NEON::BI__builtin_neon_vluti2_lane_mf8:
3252 case NEON::BI__builtin_neon_vluti2_lane_bf16:
3253 case NEON::BI__builtin_neon_vluti2_lane_f16:
3254 case NEON::BI__builtin_neon_vluti2_lane_p16:
3255 case NEON::BI__builtin_neon_vluti2_lane_p8:
3256 case NEON::BI__builtin_neon_vluti2_lane_s16:
3257 case NEON::BI__builtin_neon_vluti2_lane_s8:
3258 case NEON::BI__builtin_neon_vluti2_lane_u16:
3259 case NEON::BI__builtin_neon_vluti2_lane_u8:
3260 case NEON::BI__builtin_neon_vluti2q_lane_mf8:
3261 case NEON::BI__builtin_neon_vluti2q_lane_bf16:
3262 case NEON::BI__builtin_neon_vluti2q_lane_f16:
3263 case NEON::BI__builtin_neon_vluti2q_lane_p16:
3264 case NEON::BI__builtin_neon_vluti2q_lane_p8:
3265 case NEON::BI__builtin_neon_vluti2q_lane_s16:
3266 case NEON::BI__builtin_neon_vluti2q_lane_s8:
3267 case NEON::BI__builtin_neon_vluti2q_lane_u16:
3268 case NEON::BI__builtin_neon_vluti2q_lane_u8:
3269 case NEON::BI__builtin_neon_vluti4q_lane_mf8:
3270 case NEON::BI__builtin_neon_vluti4q_lane_p8:
3271 case NEON::BI__builtin_neon_vluti4q_lane_s8:
3272 case NEON::BI__builtin_neon_vluti4q_lane_u8:
3273 case NEON::BI__builtin_neon_vluti4q_laneq_mf8:
3274 case NEON::BI__builtin_neon_vluti4q_laneq_p8:
3275 case NEON::BI__builtin_neon_vluti4q_laneq_s8:
3276 case NEON::BI__builtin_neon_vluti4q_laneq_u8:
3277 case NEON::BI__builtin_neon_vluti4q_lane_bf16_x2:
3278 case NEON::BI__builtin_neon_vluti4q_lane_f16_x2:
3279 case NEON::BI__builtin_neon_vluti4q_lane_p16_x2:
3280 case NEON::BI__builtin_neon_vluti4q_lane_s16_x2:
3281 case NEON::BI__builtin_neon_vluti4q_lane_u16_x2:
3282 case NEON::BI__builtin_neon_vluti4q_laneq_bf16_x2:
3283 case NEON::BI__builtin_neon_vluti4q_laneq_f16_x2:
3284 case NEON::BI__builtin_neon_vluti4q_laneq_p16_x2:
3285 case NEON::BI__builtin_neon_vluti4q_laneq_s16_x2:
3286 case NEON::BI__builtin_neon_vluti4q_laneq_u16_x2:
3287 case NEON::BI__builtin_neon_vmmlaq_f16_mf8_fpm:
3288 case NEON::BI__builtin_neon_vmmlaq_f32_mf8_fpm:
3289 case NEON::BI__builtin_neon_vcvt1_low_bf16_mf8_fpm:
3290 case NEON::BI__builtin_neon_vcvt1_bf16_mf8_fpm:
3291 case NEON::BI__builtin_neon_vcvt1_high_bf16_mf8_fpm:
3292 case NEON::BI__builtin_neon_vcvt2_low_bf16_mf8_fpm:
3293 case NEON::BI__builtin_neon_vcvt2_bf16_mf8_fpm:
3294 case NEON::BI__builtin_neon_vcvt2_high_bf16_mf8_fpm:
3295 case NEON::BI__builtin_neon_vcvt1_low_f16_mf8_fpm:
3296 case NEON::BI__builtin_neon_vcvt1_f16_mf8_fpm:
3297 case NEON::BI__builtin_neon_vcvt1_high_f16_mf8_fpm:
3298 case NEON::BI__builtin_neon_vcvt2_low_f16_mf8_fpm:
3299 case NEON::BI__builtin_neon_vcvt2_f16_mf8_fpm:
3300 case NEON::BI__builtin_neon_vcvt2_high_f16_mf8_fpm:
3301 case NEON::BI__builtin_neon_vcvt_mf8_f32_fpm:
3302 case NEON::BI__builtin_neon_vcvt_mf8_f16_fpm:
3303 case NEON::BI__builtin_neon_vcvtq_mf8_f16_fpm:
3304 case NEON::BI__builtin_neon_vcvt_high_mf8_f32_fpm:
3305 case NEON::BI__builtin_neon_vdot_f16_mf8_fpm:
3306 case NEON::BI__builtin_neon_vdotq_f16_mf8_fpm:
3307 case NEON::BI__builtin_neon_vdot_lane_f16_mf8_fpm:
3308 case NEON::BI__builtin_neon_vdotq_lane_f16_mf8_fpm:
3309 case NEON::BI__builtin_neon_vdot_laneq_f16_mf8_fpm:
3310 case NEON::BI__builtin_neon_vdotq_laneq_f16_mf8_fpm:
3311 case NEON::BI__builtin_neon_vdot_f32_mf8_fpm:
3312 case NEON::BI__builtin_neon_vdotq_f32_mf8_fpm:
3313 case NEON::BI__builtin_neon_vdot_lane_f32_mf8_fpm:
3314 case NEON::BI__builtin_neon_vdotq_lane_f32_mf8_fpm:
3315 case NEON::BI__builtin_neon_vdot_laneq_f32_mf8_fpm:
3316 case NEON::BI__builtin_neon_vdotq_laneq_f32_mf8_fpm:
3317 case NEON::BI__builtin_neon_vmlalbq_f16_mf8_fpm:
3318 case NEON::BI__builtin_neon_vmlaltq_f16_mf8_fpm:
3319 case NEON::BI__builtin_neon_vmlallbbq_f32_mf8_fpm:
3320 case NEON::BI__builtin_neon_vmlallbtq_f32_mf8_fpm:
3321 case NEON::BI__builtin_neon_vmlalltbq_f32_mf8_fpm:
3322 case NEON::BI__builtin_neon_vmlallttq_f32_mf8_fpm:
3323 case NEON::BI__builtin_neon_vmlalbq_lane_f16_mf8_fpm:
3324 case NEON::BI__builtin_neon_vmlalbq_laneq_f16_mf8_fpm:
3325 case NEON::BI__builtin_neon_vmlaltq_lane_f16_mf8_fpm:
3326 case NEON::BI__builtin_neon_vmlaltq_laneq_f16_mf8_fpm:
3327 case NEON::BI__builtin_neon_vmlallbbq_lane_f32_mf8_fpm:
3328 case NEON::BI__builtin_neon_vmlallbbq_laneq_f32_mf8_fpm:
3329 case NEON::BI__builtin_neon_vmlallbtq_lane_f32_mf8_fpm:
3330 case NEON::BI__builtin_neon_vmlallbtq_laneq_f32_mf8_fpm:
3331 case NEON::BI__builtin_neon_vmlalltbq_lane_f32_mf8_fpm:
3332 case NEON::BI__builtin_neon_vmlalltbq_laneq_f32_mf8_fpm:
3333 case NEON::BI__builtin_neon_vmlallttq_lane_f32_mf8_fpm:
3334 case NEON::BI__builtin_neon_vmlallttq_laneq_f32_mf8_fpm:
3335 case NEON::BI__builtin_neon_vamin_f16:
3336 case NEON::BI__builtin_neon_vaminq_f16:
3337 case NEON::BI__builtin_neon_vamin_f32:
3338 case NEON::BI__builtin_neon_vaminq_f32:
3339 case NEON::BI__builtin_neon_vaminq_f64:
3340 case NEON::BI__builtin_neon_vamax_f16:
3341 case NEON::BI__builtin_neon_vamaxq_f16:
3342 case NEON::BI__builtin_neon_vamax_f32:
3343 case NEON::BI__builtin_neon_vamaxq_f32:
3344 case NEON::BI__builtin_neon_vamaxq_f64:
3345 case NEON::BI__builtin_neon_vscale_f16:
3346 case NEON::BI__builtin_neon_vscaleq_f16:
3347 case NEON::BI__builtin_neon_vscale_f32:
3348 case NEON::BI__builtin_neon_vscaleq_f32:
3349 case NEON::BI__builtin_neon_vscaleq_f64:
3350 cgm.errorNYI(
expr->getSourceRange(),
3351 std::string(
"unimplemented AArch64 builtin call: ") +
3352 getContext().BuiltinInfo.getName(builtinID));
3353 return mlir::Value{};