804 if (builtinID == Builtin::BI__builtin_cpu_is) {
805 cgm.errorNYI(
expr->getSourceRange(),
"__builtin_cpu_is");
806 return mlir::Value{};
808 if (builtinID == Builtin::BI__builtin_cpu_supports) {
809 cgm.errorNYI(
expr->getSourceRange(),
"__builtin_cpu_supports");
810 return mlir::Value{};
812 if (builtinID == Builtin::BI__builtin_cpu_init) {
813 cgm.errorNYI(
expr->getSourceRange(),
"__builtin_cpu_init");
814 return mlir::Value{};
829 unsigned iceArguments = 0;
834 for (
auto [idx, arg] : llvm::enumerate(
expr->arguments()))
838 mlir::Type
voidTy = builder.getVoidTy();
843 case X86::BI_mm_clflush:
844 return builder.emitIntrinsicCallOp(
getLoc(
expr->getExprLoc()),
845 "x86.sse2.clflush",
voidTy, ops[0]);
846 case X86::BI_mm_lfence:
847 return builder.emitIntrinsicCallOp(
getLoc(
expr->getExprLoc()),
848 "x86.sse2.lfence",
voidTy);
849 case X86::BI_mm_pause:
850 return builder.emitIntrinsicCallOp(
getLoc(
expr->getExprLoc()),
851 "x86.sse2.pause",
voidTy);
852 case X86::BI_mm_mfence:
853 return builder.emitIntrinsicCallOp(
getLoc(
expr->getExprLoc()),
854 "x86.sse2.mfence",
voidTy);
855 case X86::BI_mm_sfence:
856 return builder.emitIntrinsicCallOp(
getLoc(
expr->getExprLoc()),
857 "x86.sse.sfence",
voidTy);
858 case X86::BI_mm_prefetch:
859 case X86::BI_m_prefetch:
860 case X86::BI_m_prefetchw:
863 return builder.emitIntrinsicCallOp(
getLoc(
expr->getExprLoc()),
"x86.rdtsc",
864 builder.getUInt64Ty());
865 case X86::BI__builtin_ia32_rdtscp: {
866 mlir::Location loc =
getLoc(
expr->getExprLoc());
867 mlir::Type i64Ty = builder.getUInt64Ty();
868 mlir::Type i32Ty = builder.getUInt32Ty();
869 mlir::Type structTy = builder.getAnonRecordTy({i64Ty, i32Ty});
871 builder.emitIntrinsicCallOp(loc,
"x86.rdtscp", structTy);
874 mlir::Value processorId =
875 cir::ExtractMemberOp::create(builder, loc, i32Ty, result, 1);
880 return cir::ExtractMemberOp::create(builder, loc, i64Ty, result, 0);
882 case X86::BI__builtin_ia32_lzcnt_u16:
883 case X86::BI__builtin_ia32_lzcnt_u32:
884 case X86::BI__builtin_ia32_lzcnt_u64: {
885 mlir::Location loc =
getLoc(
expr->getExprLoc());
886 mlir::Value isZeroPoison = builder.getFalse(loc);
887 return builder.emitIntrinsicCallOp(loc,
"ctlz", ops[0].
getType(),
888 mlir::ValueRange{ops[0], isZeroPoison});
890 case X86::BI__builtin_ia32_tzcnt_u16:
891 case X86::BI__builtin_ia32_tzcnt_u32:
892 case X86::BI__builtin_ia32_tzcnt_u64: {
893 mlir::Location loc =
getLoc(
expr->getExprLoc());
894 mlir::Value isZeroPoison = builder.getFalse(loc);
895 return builder.emitIntrinsicCallOp(loc,
"cttz", ops[0].
getType(),
896 mlir::ValueRange{ops[0], isZeroPoison});
898 case X86::BI__builtin_ia32_undef128:
899 case X86::BI__builtin_ia32_undef256:
900 case X86::BI__builtin_ia32_undef512:
908 case X86::BI__builtin_ia32_vec_ext_v4hi:
909 case X86::BI__builtin_ia32_vec_ext_v16qi:
910 case X86::BI__builtin_ia32_vec_ext_v8hi:
911 case X86::BI__builtin_ia32_vec_ext_v4si:
912 case X86::BI__builtin_ia32_vec_ext_v4sf:
913 case X86::BI__builtin_ia32_vec_ext_v2di:
914 case X86::BI__builtin_ia32_vec_ext_v32qi:
915 case X86::BI__builtin_ia32_vec_ext_v16hi:
916 case X86::BI__builtin_ia32_vec_ext_v8si:
917 case X86::BI__builtin_ia32_vec_ext_v4di: {
921 index &= numElts - 1;
923 cir::ConstantOp indexVal =
928 return cir::VecExtractOp::create(builder,
getLoc(
expr->getExprLoc()),
931 case X86::BI__builtin_ia32_vec_set_v4hi:
932 case X86::BI__builtin_ia32_vec_set_v16qi:
933 case X86::BI__builtin_ia32_vec_set_v8hi:
934 case X86::BI__builtin_ia32_vec_set_v4si:
935 case X86::BI__builtin_ia32_vec_set_v2di:
936 case X86::BI__builtin_ia32_vec_set_v32qi:
937 case X86::BI__builtin_ia32_vec_set_v16hi:
938 case X86::BI__builtin_ia32_vec_set_v8si:
939 case X86::BI__builtin_ia32_vec_set_v4di: {
943 case X86::BI__builtin_ia32_kunpckhi:
945 "x86.avx512.kunpackb", ops);
946 case X86::BI__builtin_ia32_kunpcksi:
948 "x86.avx512.kunpackw", ops);
949 case X86::BI__builtin_ia32_kunpckdi:
951 "x86.avx512.kunpackd", ops);
952 case X86::BI_mm_setcsr:
953 case X86::BI__builtin_ia32_ldmxcsr: {
954 mlir::Location loc =
getLoc(
expr->getExprLoc());
956 builder.createStore(loc, ops[0], tmp);
957 return builder.emitIntrinsicCallOp(loc,
"x86.sse.ldmxcsr",
960 case X86::BI_mm_getcsr:
961 case X86::BI__builtin_ia32_stmxcsr: {
962 mlir::Location loc =
getLoc(
expr->getExprLoc());
964 builder.emitIntrinsicCallOp(loc,
"x86.sse.stmxcsr", builder.getVoidTy(),
966 return builder.createLoad(loc, tmp);
968 case X86::BI__builtin_ia32_xsave:
969 case X86::BI__builtin_ia32_xsave64:
970 case X86::BI__builtin_ia32_xrstor:
971 case X86::BI__builtin_ia32_xrstor64:
972 case X86::BI__builtin_ia32_xsaveopt:
973 case X86::BI__builtin_ia32_xsaveopt64:
974 case X86::BI__builtin_ia32_xrstors:
975 case X86::BI__builtin_ia32_xrstors64:
976 case X86::BI__builtin_ia32_xsavec:
977 case X86::BI__builtin_ia32_xsavec64:
978 case X86::BI__builtin_ia32_xsaves:
979 case X86::BI__builtin_ia32_xsaves64:
980 case X86::BI__builtin_ia32_xsetbv:
981 case X86::BI_xsetbv: {
982 mlir::Location loc =
getLoc(
expr->getExprLoc());
983 StringRef intrinsicName;
986 llvm_unreachable(
"Unexpected builtin");
987 case X86::BI__builtin_ia32_xsave:
988 intrinsicName =
"x86.xsave";
990 case X86::BI__builtin_ia32_xsave64:
991 intrinsicName =
"x86.xsave64";
993 case X86::BI__builtin_ia32_xrstor:
994 intrinsicName =
"x86.xrstor";
996 case X86::BI__builtin_ia32_xrstor64:
997 intrinsicName =
"x86.xrstor64";
999 case X86::BI__builtin_ia32_xsaveopt:
1000 intrinsicName =
"x86.xsaveopt";
1002 case X86::BI__builtin_ia32_xsaveopt64:
1003 intrinsicName =
"x86.xsaveopt64";
1005 case X86::BI__builtin_ia32_xrstors:
1006 intrinsicName =
"x86.xrstors";
1008 case X86::BI__builtin_ia32_xrstors64:
1009 intrinsicName =
"x86.xrstors64";
1011 case X86::BI__builtin_ia32_xsavec:
1012 intrinsicName =
"x86.xsavec";
1014 case X86::BI__builtin_ia32_xsavec64:
1015 intrinsicName =
"x86.xsavec64";
1017 case X86::BI__builtin_ia32_xsaves:
1018 intrinsicName =
"x86.xsaves";
1020 case X86::BI__builtin_ia32_xsaves64:
1021 intrinsicName =
"x86.xsaves64";
1023 case X86::BI__builtin_ia32_xsetbv:
1024 case X86::BI_xsetbv:
1025 intrinsicName =
"x86.xsetbv";
1033 mlir::Type i32Ty = builder.getSInt32Ty();
1036 cir::ConstantOp shift32 = builder.getSInt64(32, loc);
1037 mlir::Value mhi = builder.createShift(loc, ops[1], shift32.getResult(),
1039 mhi = builder.createIntCast(mhi, i32Ty);
1042 mlir::Value mlo = builder.createIntCast(ops[1], i32Ty);
1044 return builder.emitIntrinsicCallOp(loc, intrinsicName,
voidTy,
1045 mlir::ValueRange{ops[0], mhi, mlo});
1047 case X86::BI__builtin_ia32_xgetbv:
1048 case X86::BI_xgetbv:
1051 return builder.emitIntrinsicCallOp(
getLoc(
expr->getExprLoc()),
"x86.xgetbv",
1052 builder.getUInt64Ty(), ops[0]);
1053 case X86::BI__builtin_ia32_storedqudi128_mask:
1054 case X86::BI__builtin_ia32_storedqusi128_mask:
1055 case X86::BI__builtin_ia32_storedquhi128_mask:
1056 case X86::BI__builtin_ia32_storedquqi128_mask:
1057 case X86::BI__builtin_ia32_storeupd128_mask:
1058 case X86::BI__builtin_ia32_storeups128_mask:
1059 case X86::BI__builtin_ia32_storedqudi256_mask:
1060 case X86::BI__builtin_ia32_storedqusi256_mask:
1061 case X86::BI__builtin_ia32_storedquhi256_mask:
1062 case X86::BI__builtin_ia32_storedquqi256_mask:
1063 case X86::BI__builtin_ia32_storeupd256_mask:
1064 case X86::BI__builtin_ia32_storeups256_mask:
1065 case X86::BI__builtin_ia32_storedqudi512_mask:
1066 case X86::BI__builtin_ia32_storedqusi512_mask:
1067 case X86::BI__builtin_ia32_storedquhi512_mask:
1068 case X86::BI__builtin_ia32_storedquqi512_mask:
1069 case X86::BI__builtin_ia32_storeupd512_mask:
1070 case X86::BI__builtin_ia32_storeups512_mask:
1071 case X86::BI__builtin_ia32_storesbf16128_mask:
1072 case X86::BI__builtin_ia32_storesh128_mask:
1073 case X86::BI__builtin_ia32_storess128_mask:
1074 case X86::BI__builtin_ia32_storesd128_mask:
1075 cgm.errorNYI(
expr->getSourceRange(),
1076 std::string(
"unimplemented x86 builtin call: ") +
1077 getContext().BuiltinInfo.getName(builtinID));
1078 return mlir::Value{};
1079 case X86::BI__builtin_ia32_cvtmask2b128:
1080 case X86::BI__builtin_ia32_cvtmask2b256:
1081 case X86::BI__builtin_ia32_cvtmask2b512:
1082 case X86::BI__builtin_ia32_cvtmask2w128:
1083 case X86::BI__builtin_ia32_cvtmask2w256:
1084 case X86::BI__builtin_ia32_cvtmask2w512:
1085 case X86::BI__builtin_ia32_cvtmask2d128:
1086 case X86::BI__builtin_ia32_cvtmask2d256:
1087 case X86::BI__builtin_ia32_cvtmask2d512:
1088 case X86::BI__builtin_ia32_cvtmask2q128:
1089 case X86::BI__builtin_ia32_cvtmask2q256:
1090 case X86::BI__builtin_ia32_cvtmask2q512:
1094 case X86::BI__builtin_ia32_cvtb2mask128:
1095 case X86::BI__builtin_ia32_cvtb2mask256:
1096 case X86::BI__builtin_ia32_cvtb2mask512:
1097 case X86::BI__builtin_ia32_cvtw2mask128:
1098 case X86::BI__builtin_ia32_cvtw2mask256:
1099 case X86::BI__builtin_ia32_cvtw2mask512:
1100 case X86::BI__builtin_ia32_cvtd2mask128:
1101 case X86::BI__builtin_ia32_cvtd2mask256:
1102 case X86::BI__builtin_ia32_cvtd2mask512:
1103 case X86::BI__builtin_ia32_cvtq2mask128:
1104 case X86::BI__builtin_ia32_cvtq2mask256:
1105 case X86::BI__builtin_ia32_cvtq2mask512:
1108 case X86::BI__builtin_ia32_cvtdq2ps512_mask:
1109 case X86::BI__builtin_ia32_cvtqq2ps512_mask:
1110 case X86::BI__builtin_ia32_cvtqq2pd512_mask:
1111 case X86::BI__builtin_ia32_vcvtw2ph512_mask:
1112 case X86::BI__builtin_ia32_vcvtdq2ph512_mask:
1113 case X86::BI__builtin_ia32_vcvtqq2ph512_mask:
1114 case X86::BI__builtin_ia32_cvtudq2ps512_mask:
1115 case X86::BI__builtin_ia32_cvtuqq2ps512_mask:
1116 case X86::BI__builtin_ia32_cvtuqq2pd512_mask:
1117 case X86::BI__builtin_ia32_vcvtuw2ph512_mask:
1118 case X86::BI__builtin_ia32_vcvtudq2ph512_mask:
1119 case X86::BI__builtin_ia32_vcvtuqq2ph512_mask:
1120 case X86::BI__builtin_ia32_vfmaddsh3_mask:
1121 case X86::BI__builtin_ia32_vfmaddss3_mask:
1122 case X86::BI__builtin_ia32_vfmaddsd3_mask:
1123 case X86::BI__builtin_ia32_vfmaddsh3_maskz:
1124 case X86::BI__builtin_ia32_vfmaddss3_maskz:
1125 case X86::BI__builtin_ia32_vfmaddsd3_maskz:
1126 case X86::BI__builtin_ia32_vfmaddsh3_mask3:
1127 case X86::BI__builtin_ia32_vfmaddss3_mask3:
1128 case X86::BI__builtin_ia32_vfmaddsd3_mask3:
1129 case X86::BI__builtin_ia32_vfmsubsh3_mask3:
1130 case X86::BI__builtin_ia32_vfmsubss3_mask3:
1131 case X86::BI__builtin_ia32_vfmsubsd3_mask3:
1132 case X86::BI__builtin_ia32_vfmaddph512_mask:
1133 case X86::BI__builtin_ia32_vfmaddph512_maskz:
1134 case X86::BI__builtin_ia32_vfmaddph512_mask3:
1135 case X86::BI__builtin_ia32_vfmaddps512_mask:
1136 case X86::BI__builtin_ia32_vfmaddps512_maskz:
1137 case X86::BI__builtin_ia32_vfmaddps512_mask3:
1138 case X86::BI__builtin_ia32_vfmsubps512_mask3:
1139 case X86::BI__builtin_ia32_vfmaddpd512_mask:
1140 case X86::BI__builtin_ia32_vfmaddpd512_maskz:
1141 case X86::BI__builtin_ia32_vfmaddpd512_mask3:
1142 case X86::BI__builtin_ia32_vfmsubpd512_mask3:
1143 case X86::BI__builtin_ia32_vfmsubph512_mask3:
1144 case X86::BI__builtin_ia32_vfmaddsubph512_mask:
1145 case X86::BI__builtin_ia32_vfmaddsubph512_maskz:
1146 case X86::BI__builtin_ia32_vfmaddsubph512_mask3:
1147 case X86::BI__builtin_ia32_vfmsubaddph512_mask3:
1148 case X86::BI__builtin_ia32_vfmaddsubps512_mask:
1149 case X86::BI__builtin_ia32_vfmaddsubps512_maskz:
1150 case X86::BI__builtin_ia32_vfmaddsubps512_mask3:
1151 case X86::BI__builtin_ia32_vfmsubaddps512_mask3:
1152 case X86::BI__builtin_ia32_vfmaddsubpd512_mask:
1153 case X86::BI__builtin_ia32_vfmaddsubpd512_maskz:
1154 case X86::BI__builtin_ia32_vfmaddsubpd512_mask3:
1155 case X86::BI__builtin_ia32_vfmsubaddpd512_mask3:
1156 case X86::BI__builtin_ia32_movdqa32store128_mask:
1157 case X86::BI__builtin_ia32_movdqa64store128_mask:
1158 case X86::BI__builtin_ia32_storeaps128_mask:
1159 case X86::BI__builtin_ia32_storeapd128_mask:
1160 case X86::BI__builtin_ia32_movdqa32store256_mask:
1161 case X86::BI__builtin_ia32_movdqa64store256_mask:
1162 case X86::BI__builtin_ia32_storeaps256_mask:
1163 case X86::BI__builtin_ia32_storeapd256_mask:
1164 case X86::BI__builtin_ia32_movdqa32store512_mask:
1165 case X86::BI__builtin_ia32_movdqa64store512_mask:
1166 case X86::BI__builtin_ia32_storeaps512_mask:
1167 case X86::BI__builtin_ia32_storeapd512_mask:
1168 cgm.errorNYI(
expr->getSourceRange(),
1169 std::string(
"unimplemented X86 builtin call: ") +
1170 getContext().BuiltinInfo.getName(builtinID));
1173 case X86::BI__builtin_ia32_loadups128_mask:
1174 case X86::BI__builtin_ia32_loadups256_mask:
1175 case X86::BI__builtin_ia32_loadups512_mask:
1176 case X86::BI__builtin_ia32_loadupd128_mask:
1177 case X86::BI__builtin_ia32_loadupd256_mask:
1178 case X86::BI__builtin_ia32_loadupd512_mask:
1179 case X86::BI__builtin_ia32_loaddquqi128_mask:
1180 case X86::BI__builtin_ia32_loaddquqi256_mask:
1181 case X86::BI__builtin_ia32_loaddquqi512_mask:
1182 case X86::BI__builtin_ia32_loaddquhi128_mask:
1183 case X86::BI__builtin_ia32_loaddquhi256_mask:
1184 case X86::BI__builtin_ia32_loaddquhi512_mask:
1185 case X86::BI__builtin_ia32_loaddqusi128_mask:
1186 case X86::BI__builtin_ia32_loaddqusi256_mask:
1187 case X86::BI__builtin_ia32_loaddqusi512_mask:
1188 case X86::BI__builtin_ia32_loaddqudi128_mask:
1189 case X86::BI__builtin_ia32_loaddqudi256_mask:
1190 case X86::BI__builtin_ia32_loaddqudi512_mask:
1191 case X86::BI__builtin_ia32_loadsbf16128_mask:
1192 case X86::BI__builtin_ia32_loadsh128_mask:
1193 case X86::BI__builtin_ia32_loadss128_mask:
1194 case X86::BI__builtin_ia32_loadsd128_mask:
1198 case X86::BI__builtin_ia32_loadaps128_mask:
1199 case X86::BI__builtin_ia32_loadaps256_mask:
1200 case X86::BI__builtin_ia32_loadaps512_mask:
1201 case X86::BI__builtin_ia32_loadapd128_mask:
1202 case X86::BI__builtin_ia32_loadapd256_mask:
1203 case X86::BI__builtin_ia32_loadapd512_mask:
1204 case X86::BI__builtin_ia32_movdqa32load128_mask:
1205 case X86::BI__builtin_ia32_movdqa32load256_mask:
1206 case X86::BI__builtin_ia32_movdqa32load512_mask:
1207 case X86::BI__builtin_ia32_movdqa64load128_mask:
1208 case X86::BI__builtin_ia32_movdqa64load256_mask:
1209 case X86::BI__builtin_ia32_movdqa64load512_mask:
1213 .getTypeAlignInChars(
expr->getArg(1)->getType())
1217 case X86::BI__builtin_ia32_expandloaddf128_mask:
1218 case X86::BI__builtin_ia32_expandloaddf256_mask:
1219 case X86::BI__builtin_ia32_expandloaddf512_mask:
1220 case X86::BI__builtin_ia32_expandloadsf128_mask:
1221 case X86::BI__builtin_ia32_expandloadsf256_mask:
1222 case X86::BI__builtin_ia32_expandloadsf512_mask:
1223 case X86::BI__builtin_ia32_expandloaddi128_mask:
1224 case X86::BI__builtin_ia32_expandloaddi256_mask:
1225 case X86::BI__builtin_ia32_expandloaddi512_mask:
1226 case X86::BI__builtin_ia32_expandloadsi128_mask:
1227 case X86::BI__builtin_ia32_expandloadsi256_mask:
1228 case X86::BI__builtin_ia32_expandloadsi512_mask:
1229 case X86::BI__builtin_ia32_expandloadhi128_mask:
1230 case X86::BI__builtin_ia32_expandloadhi256_mask:
1231 case X86::BI__builtin_ia32_expandloadhi512_mask:
1232 case X86::BI__builtin_ia32_expandloadqi128_mask:
1233 case X86::BI__builtin_ia32_expandloadqi256_mask:
1234 case X86::BI__builtin_ia32_expandloadqi512_mask:
1235 case X86::BI__builtin_ia32_compressstoredf128_mask:
1236 case X86::BI__builtin_ia32_compressstoredf256_mask:
1237 case X86::BI__builtin_ia32_compressstoredf512_mask:
1238 case X86::BI__builtin_ia32_compressstoresf128_mask:
1239 case X86::BI__builtin_ia32_compressstoresf256_mask:
1240 case X86::BI__builtin_ia32_compressstoresf512_mask:
1241 case X86::BI__builtin_ia32_compressstoredi128_mask:
1242 case X86::BI__builtin_ia32_compressstoredi256_mask:
1243 case X86::BI__builtin_ia32_compressstoredi512_mask:
1244 case X86::BI__builtin_ia32_compressstoresi128_mask:
1245 case X86::BI__builtin_ia32_compressstoresi256_mask:
1246 case X86::BI__builtin_ia32_compressstoresi512_mask:
1247 case X86::BI__builtin_ia32_compressstorehi128_mask:
1248 case X86::BI__builtin_ia32_compressstorehi256_mask:
1249 case X86::BI__builtin_ia32_compressstorehi512_mask:
1250 case X86::BI__builtin_ia32_compressstoreqi128_mask:
1251 case X86::BI__builtin_ia32_compressstoreqi256_mask:
1252 case X86::BI__builtin_ia32_compressstoreqi512_mask:
1253 cgm.errorNYI(
expr->getSourceRange(),
1254 std::string(
"unimplemented X86 builtin call: ") +
1255 getContext().BuiltinInfo.getName(builtinID));
1256 return mlir::Value{};
1257 case X86::BI__builtin_ia32_expanddf128_mask:
1258 case X86::BI__builtin_ia32_expanddf256_mask:
1259 case X86::BI__builtin_ia32_expanddf512_mask:
1260 case X86::BI__builtin_ia32_expandsf128_mask:
1261 case X86::BI__builtin_ia32_expandsf256_mask:
1262 case X86::BI__builtin_ia32_expandsf512_mask:
1263 case X86::BI__builtin_ia32_expanddi128_mask:
1264 case X86::BI__builtin_ia32_expanddi256_mask:
1265 case X86::BI__builtin_ia32_expanddi512_mask:
1266 case X86::BI__builtin_ia32_expandsi128_mask:
1267 case X86::BI__builtin_ia32_expandsi256_mask:
1268 case X86::BI__builtin_ia32_expandsi512_mask:
1269 case X86::BI__builtin_ia32_expandhi128_mask:
1270 case X86::BI__builtin_ia32_expandhi256_mask:
1271 case X86::BI__builtin_ia32_expandhi512_mask:
1272 case X86::BI__builtin_ia32_expandqi128_mask:
1273 case X86::BI__builtin_ia32_expandqi256_mask:
1274 case X86::BI__builtin_ia32_expandqi512_mask: {
1275 mlir::Location loc =
getLoc(
expr->getExprLoc());
1277 "x86.avx512.mask.expand");
1279 case X86::BI__builtin_ia32_compressdf128_mask:
1280 case X86::BI__builtin_ia32_compressdf256_mask:
1281 case X86::BI__builtin_ia32_compressdf512_mask:
1282 case X86::BI__builtin_ia32_compresssf128_mask:
1283 case X86::BI__builtin_ia32_compresssf256_mask:
1284 case X86::BI__builtin_ia32_compresssf512_mask:
1285 case X86::BI__builtin_ia32_compressdi128_mask:
1286 case X86::BI__builtin_ia32_compressdi256_mask:
1287 case X86::BI__builtin_ia32_compressdi512_mask:
1288 case X86::BI__builtin_ia32_compresssi128_mask:
1289 case X86::BI__builtin_ia32_compresssi256_mask:
1290 case X86::BI__builtin_ia32_compresssi512_mask:
1291 case X86::BI__builtin_ia32_compresshi128_mask:
1292 case X86::BI__builtin_ia32_compresshi256_mask:
1293 case X86::BI__builtin_ia32_compresshi512_mask:
1294 case X86::BI__builtin_ia32_compressqi128_mask:
1295 case X86::BI__builtin_ia32_compressqi256_mask:
1296 case X86::BI__builtin_ia32_compressqi512_mask: {
1297 mlir::Location loc =
getLoc(
expr->getExprLoc());
1299 "x86.avx512.mask.compress");
1301 case X86::BI__builtin_ia32_gather3div2df:
1302 case X86::BI__builtin_ia32_gather3div2di:
1303 case X86::BI__builtin_ia32_gather3div4df:
1304 case X86::BI__builtin_ia32_gather3div4di:
1305 case X86::BI__builtin_ia32_gather3div4sf:
1306 case X86::BI__builtin_ia32_gather3div4si:
1307 case X86::BI__builtin_ia32_gather3div8sf:
1308 case X86::BI__builtin_ia32_gather3div8si:
1309 case X86::BI__builtin_ia32_gather3siv2df:
1310 case X86::BI__builtin_ia32_gather3siv2di:
1311 case X86::BI__builtin_ia32_gather3siv4df:
1312 case X86::BI__builtin_ia32_gather3siv4di:
1313 case X86::BI__builtin_ia32_gather3siv4sf:
1314 case X86::BI__builtin_ia32_gather3siv4si:
1315 case X86::BI__builtin_ia32_gather3siv8sf:
1316 case X86::BI__builtin_ia32_gather3siv8si:
1317 case X86::BI__builtin_ia32_gathersiv8df:
1318 case X86::BI__builtin_ia32_gathersiv16sf:
1319 case X86::BI__builtin_ia32_gatherdiv8df:
1320 case X86::BI__builtin_ia32_gatherdiv16sf:
1321 case X86::BI__builtin_ia32_gathersiv8di:
1322 case X86::BI__builtin_ia32_gathersiv16si:
1323 case X86::BI__builtin_ia32_gatherdiv8di:
1324 case X86::BI__builtin_ia32_gatherdiv16si: {
1325 StringRef intrinsicName;
1326 switch (builtinID) {
1328 llvm_unreachable(
"Unexpected builtin");
1329 case X86::BI__builtin_ia32_gather3div2df:
1330 intrinsicName =
"x86.avx512.mask.gather3div2.df";
1332 case X86::BI__builtin_ia32_gather3div2di:
1333 intrinsicName =
"x86.avx512.mask.gather3div2.di";
1335 case X86::BI__builtin_ia32_gather3div4df:
1336 intrinsicName =
"x86.avx512.mask.gather3div4.df";
1338 case X86::BI__builtin_ia32_gather3div4di:
1339 intrinsicName =
"x86.avx512.mask.gather3div4.di";
1341 case X86::BI__builtin_ia32_gather3div4sf:
1342 intrinsicName =
"x86.avx512.mask.gather3div4.sf";
1344 case X86::BI__builtin_ia32_gather3div4si:
1345 intrinsicName =
"x86.avx512.mask.gather3div4.si";
1347 case X86::BI__builtin_ia32_gather3div8sf:
1348 intrinsicName =
"x86.avx512.mask.gather3div8.sf";
1350 case X86::BI__builtin_ia32_gather3div8si:
1351 intrinsicName =
"x86.avx512.mask.gather3div8.si";
1353 case X86::BI__builtin_ia32_gather3siv2df:
1354 intrinsicName =
"x86.avx512.mask.gather3siv2.df";
1356 case X86::BI__builtin_ia32_gather3siv2di:
1357 intrinsicName =
"x86.avx512.mask.gather3siv2.di";
1359 case X86::BI__builtin_ia32_gather3siv4df:
1360 intrinsicName =
"x86.avx512.mask.gather3siv4.df";
1362 case X86::BI__builtin_ia32_gather3siv4di:
1363 intrinsicName =
"x86.avx512.mask.gather3siv4.di";
1365 case X86::BI__builtin_ia32_gather3siv4sf:
1366 intrinsicName =
"x86.avx512.mask.gather3siv4.sf";
1368 case X86::BI__builtin_ia32_gather3siv4si:
1369 intrinsicName =
"x86.avx512.mask.gather3siv4.si";
1371 case X86::BI__builtin_ia32_gather3siv8sf:
1372 intrinsicName =
"x86.avx512.mask.gather3siv8.sf";
1374 case X86::BI__builtin_ia32_gather3siv8si:
1375 intrinsicName =
"x86.avx512.mask.gather3siv8.si";
1377 case X86::BI__builtin_ia32_gathersiv8df:
1378 intrinsicName =
"x86.avx512.mask.gather.dpd.512";
1380 case X86::BI__builtin_ia32_gathersiv16sf:
1381 intrinsicName =
"x86.avx512.mask.gather.dps.512";
1383 case X86::BI__builtin_ia32_gatherdiv8df:
1384 intrinsicName =
"x86.avx512.mask.gather.qpd.512";
1386 case X86::BI__builtin_ia32_gatherdiv16sf:
1387 intrinsicName =
"x86.avx512.mask.gather.qps.512";
1389 case X86::BI__builtin_ia32_gathersiv8di:
1390 intrinsicName =
"x86.avx512.mask.gather.dpq.512";
1392 case X86::BI__builtin_ia32_gathersiv16si:
1393 intrinsicName =
"x86.avx512.mask.gather.dpi.512";
1395 case X86::BI__builtin_ia32_gatherdiv8di:
1396 intrinsicName =
"x86.avx512.mask.gather.qpq.512";
1398 case X86::BI__builtin_ia32_gatherdiv16si:
1399 intrinsicName =
"x86.avx512.mask.gather.qpi.512";
1403 mlir::Location loc =
getLoc(
expr->getExprLoc());
1408 return builder.emitIntrinsicCallOp(loc, intrinsicName,
1411 case X86::BI__builtin_ia32_scattersiv8df:
1412 case X86::BI__builtin_ia32_scattersiv16sf:
1413 case X86::BI__builtin_ia32_scatterdiv8df:
1414 case X86::BI__builtin_ia32_scatterdiv16sf:
1415 case X86::BI__builtin_ia32_scattersiv8di:
1416 case X86::BI__builtin_ia32_scattersiv16si:
1417 case X86::BI__builtin_ia32_scatterdiv8di:
1418 case X86::BI__builtin_ia32_scatterdiv16si:
1419 case X86::BI__builtin_ia32_scatterdiv2df:
1420 case X86::BI__builtin_ia32_scatterdiv2di:
1421 case X86::BI__builtin_ia32_scatterdiv4df:
1422 case X86::BI__builtin_ia32_scatterdiv4di:
1423 case X86::BI__builtin_ia32_scatterdiv4sf:
1424 case X86::BI__builtin_ia32_scatterdiv4si:
1425 case X86::BI__builtin_ia32_scatterdiv8sf:
1426 case X86::BI__builtin_ia32_scatterdiv8si:
1427 case X86::BI__builtin_ia32_scattersiv2df:
1428 case X86::BI__builtin_ia32_scattersiv2di:
1429 case X86::BI__builtin_ia32_scattersiv4df:
1430 case X86::BI__builtin_ia32_scattersiv4di:
1431 case X86::BI__builtin_ia32_scattersiv4sf:
1432 case X86::BI__builtin_ia32_scattersiv4si:
1433 case X86::BI__builtin_ia32_scattersiv8sf:
1434 case X86::BI__builtin_ia32_scattersiv8si: {
1435 llvm::StringRef intrinsicName;
1436 switch (builtinID) {
1438 llvm_unreachable(
"Unexpected builtin");
1439 case X86::BI__builtin_ia32_scattersiv8df:
1440 intrinsicName =
"x86.avx512.mask.scatter.dpd.512";
1442 case X86::BI__builtin_ia32_scattersiv16sf:
1443 intrinsicName =
"x86.avx512.mask.scatter.dps.512";
1445 case X86::BI__builtin_ia32_scatterdiv8df:
1446 intrinsicName =
"x86.avx512.mask.scatter.qpd.512";
1448 case X86::BI__builtin_ia32_scatterdiv16sf:
1449 intrinsicName =
"x86.avx512.mask.scatter.qps.512";
1451 case X86::BI__builtin_ia32_scattersiv8di:
1452 intrinsicName =
"x86.avx512.mask.scatter.dpq.512";
1454 case X86::BI__builtin_ia32_scattersiv16si:
1455 intrinsicName =
"x86.avx512.mask.scatter.dpi.512";
1457 case X86::BI__builtin_ia32_scatterdiv8di:
1458 intrinsicName =
"x86.avx512.mask.scatter.qpq.512";
1460 case X86::BI__builtin_ia32_scatterdiv16si:
1461 intrinsicName =
"x86.avx512.mask.scatter.qpi.512";
1463 case X86::BI__builtin_ia32_scatterdiv2df:
1464 intrinsicName =
"x86.avx512.mask.scatterdiv2.df";
1466 case X86::BI__builtin_ia32_scatterdiv2di:
1467 intrinsicName =
"x86.avx512.mask.scatterdiv2.di";
1469 case X86::BI__builtin_ia32_scatterdiv4df:
1470 intrinsicName =
"x86.avx512.mask.scatterdiv4.df";
1472 case X86::BI__builtin_ia32_scatterdiv4di:
1473 intrinsicName =
"x86.avx512.mask.scatterdiv4.di";
1475 case X86::BI__builtin_ia32_scatterdiv4sf:
1476 intrinsicName =
"x86.avx512.mask.scatterdiv4.sf";
1478 case X86::BI__builtin_ia32_scatterdiv4si:
1479 intrinsicName =
"x86.avx512.mask.scatterdiv4.si";
1481 case X86::BI__builtin_ia32_scatterdiv8sf:
1482 intrinsicName =
"x86.avx512.mask.scatterdiv8.sf";
1484 case X86::BI__builtin_ia32_scatterdiv8si:
1485 intrinsicName =
"x86.avx512.mask.scatterdiv8.si";
1487 case X86::BI__builtin_ia32_scattersiv2df:
1488 intrinsicName =
"x86.avx512.mask.scattersiv2.df";
1490 case X86::BI__builtin_ia32_scattersiv2di:
1491 intrinsicName =
"x86.avx512.mask.scattersiv2.di";
1493 case X86::BI__builtin_ia32_scattersiv4df:
1494 intrinsicName =
"x86.avx512.mask.scattersiv4.df";
1496 case X86::BI__builtin_ia32_scattersiv4di:
1497 intrinsicName =
"x86.avx512.mask.scattersiv4.di";
1499 case X86::BI__builtin_ia32_scattersiv4sf:
1500 intrinsicName =
"x86.avx512.mask.scattersiv4.sf";
1502 case X86::BI__builtin_ia32_scattersiv4si:
1503 intrinsicName =
"x86.avx512.mask.scattersiv4.si";
1505 case X86::BI__builtin_ia32_scattersiv8sf:
1506 intrinsicName =
"x86.avx512.mask.scattersiv8.sf";
1508 case X86::BI__builtin_ia32_scattersiv8si:
1509 intrinsicName =
"x86.avx512.mask.scattersiv8.si";
1513 mlir::Location loc =
getLoc(
expr->getExprLoc());
1519 return builder.emitIntrinsicCallOp(loc, intrinsicName,
1522 case X86::BI__builtin_ia32_vextractf128_pd256:
1523 case X86::BI__builtin_ia32_vextractf128_ps256:
1524 case X86::BI__builtin_ia32_vextractf128_si256:
1525 case X86::BI__builtin_ia32_extract128i256:
1526 case X86::BI__builtin_ia32_extractf64x4_mask:
1527 case X86::BI__builtin_ia32_extractf32x4_mask:
1528 case X86::BI__builtin_ia32_extracti64x4_mask:
1529 case X86::BI__builtin_ia32_extracti32x4_mask:
1530 case X86::BI__builtin_ia32_extractf32x8_mask:
1531 case X86::BI__builtin_ia32_extracti32x8_mask:
1532 case X86::BI__builtin_ia32_extractf32x4_256_mask:
1533 case X86::BI__builtin_ia32_extracti32x4_256_mask:
1534 case X86::BI__builtin_ia32_extractf64x2_256_mask:
1535 case X86::BI__builtin_ia32_extracti64x2_256_mask:
1536 case X86::BI__builtin_ia32_extractf64x2_512_mask:
1537 case X86::BI__builtin_ia32_extracti64x2_512_mask: {
1538 mlir::Location loc =
getLoc(
expr->getExprLoc());
1540 unsigned numElts = dstTy.getSize();
1542 unsigned subVectors = srcNumElts / numElts;
1543 assert(llvm::isPowerOf2_32(subVectors) &&
"Expected power of 2 subvectors");
1545 ops[1].getDefiningOp<cir::ConstantOp>().getIntValue().getZExtValue();
1547 index &= subVectors - 1;
1550 int64_t indices[16];
1551 std::iota(indices, indices + numElts,
index);
1553 mlir::Value poison =
1554 builder.getConstant(loc, cir::PoisonAttr::get(ops[0].
getType()));
1555 mlir::Value res = builder.createVecShuffle(loc, ops[0], poison,
1557 if (ops.size() == 4)
1562 case X86::BI__builtin_ia32_vinsertf128_pd256:
1563 case X86::BI__builtin_ia32_vinsertf128_ps256:
1564 case X86::BI__builtin_ia32_vinsertf128_si256:
1565 case X86::BI__builtin_ia32_insert128i256:
1566 case X86::BI__builtin_ia32_insertf64x4:
1567 case X86::BI__builtin_ia32_insertf32x4:
1568 case X86::BI__builtin_ia32_inserti64x4:
1569 case X86::BI__builtin_ia32_inserti32x4:
1570 case X86::BI__builtin_ia32_insertf32x8:
1571 case X86::BI__builtin_ia32_inserti32x8:
1572 case X86::BI__builtin_ia32_insertf32x4_256:
1573 case X86::BI__builtin_ia32_inserti32x4_256:
1574 case X86::BI__builtin_ia32_insertf64x2_256:
1575 case X86::BI__builtin_ia32_inserti64x2_256:
1576 case X86::BI__builtin_ia32_insertf64x2_512:
1577 case X86::BI__builtin_ia32_inserti64x2_512: {
1580 unsigned subVectors = dstNumElts / srcNumElts;
1581 assert(llvm::isPowerOf2_32(subVectors) &&
"Expected power of 2 subvectors");
1582 assert(dstNumElts <= 16);
1585 index &= subVectors - 1;
1586 index *= srcNumElts;
1589 for (
unsigned i = 0; i != dstNumElts; ++i)
1590 mask[i] = (i >= srcNumElts) ? srcNumElts + (i % srcNumElts) : i;
1593 builder.createVecShuffle(
getLoc(
expr->getExprLoc()), ops[1], mask);
1595 for (
unsigned i = 0; i != dstNumElts; ++i) {
1597 mask[i] = (i -
index) + dstNumElts;
1602 return builder.createVecShuffle(
getLoc(
expr->getExprLoc()), ops[0], op1,
1605 case X86::BI__builtin_ia32_pmovqd512_mask:
1606 case X86::BI__builtin_ia32_pmovwb512_mask: {
1612 case X86::BI__builtin_ia32_pblendw128:
1613 case X86::BI__builtin_ia32_blendpd:
1614 case X86::BI__builtin_ia32_blendps:
1615 case X86::BI__builtin_ia32_blendpd256:
1616 case X86::BI__builtin_ia32_blendps256:
1617 case X86::BI__builtin_ia32_pblendw256:
1618 case X86::BI__builtin_ia32_pblendd128:
1619 case X86::BI__builtin_ia32_pblendd256: {
1626 mlir::Type i32Ty = builder.getSInt32Ty();
1627 for (
unsigned i = 0; i != numElts; ++i)
1629 cir::IntAttr::get(i32Ty, ((imm >> (i % 8)) & 0x1) ? numElts + i : i));
1631 return builder.createVecShuffle(
getLoc(
expr->getExprLoc()), ops[0], ops[1],
1634 case X86::BI__builtin_ia32_pshuflw:
1635 case X86::BI__builtin_ia32_pshuflw256:
1636 case X86::BI__builtin_ia32_pshuflw512:
1639 case X86::BI__builtin_ia32_pshufhw:
1640 case X86::BI__builtin_ia32_pshufhw256:
1641 case X86::BI__builtin_ia32_pshufhw512:
1644 case X86::BI__builtin_ia32_pshufd:
1645 case X86::BI__builtin_ia32_pshufd256:
1646 case X86::BI__builtin_ia32_pshufd512:
1647 case X86::BI__builtin_ia32_vpermilpd:
1648 case X86::BI__builtin_ia32_vpermilps:
1649 case X86::BI__builtin_ia32_vpermilpd256:
1650 case X86::BI__builtin_ia32_vpermilps256:
1651 case X86::BI__builtin_ia32_vpermilpd512:
1652 case X86::BI__builtin_ia32_vpermilps512: {
1658 return builder.createVecShuffle(
getLoc(
expr->getExprLoc()), ops[0], mask);
1660 case X86::BI__builtin_ia32_shufpd:
1661 case X86::BI__builtin_ia32_shufpd256:
1662 case X86::BI__builtin_ia32_shufpd512:
1663 case X86::BI__builtin_ia32_shufps:
1664 case X86::BI__builtin_ia32_shufps256:
1665 case X86::BI__builtin_ia32_shufps512: {
1671 return builder.createVecShuffle(
getLoc(
expr->getExprLoc()), ops[0], ops[1],
1674 case X86::BI__builtin_ia32_permdi256:
1675 case X86::BI__builtin_ia32_permdf256:
1676 case X86::BI__builtin_ia32_permdi512:
1677 case X86::BI__builtin_ia32_permdf512: {
1679 ops[1].getDefiningOp<cir::ConstantOp>().getIntValue().getZExtValue();
1685 for (
unsigned l = 0; l != numElts; l += 4)
1686 for (
unsigned i = 0; i != 4; ++i)
1687 Indices[l + i] = l + ((imm >> (2 * i)) & 0x3);
1689 return builder.createVecShuffle(
getLoc(
expr->getExprLoc()), ops[0],
1692 case X86::BI__builtin_ia32_palignr128:
1693 case X86::BI__builtin_ia32_palignr256:
1694 case X86::BI__builtin_ia32_palignr512: {
1698 assert(numElts % 16 == 0);
1708 if (shiftVal > 16) {
1715 int64_t indices[64];
1717 for (
unsigned l = 0; l != numElts; l += 16) {
1718 for (
unsigned i = 0; i != 16; ++i) {
1719 uint32_t idx = shiftVal + i;
1721 idx += numElts - 16;
1722 indices[l + i] = l + idx;
1726 return builder.createVecShuffle(
getLoc(
expr->getExprLoc()), ops[1], ops[0],
1729 case X86::BI__builtin_ia32_alignd128:
1730 case X86::BI__builtin_ia32_alignd256:
1731 case X86::BI__builtin_ia32_alignd512:
1732 case X86::BI__builtin_ia32_alignq128:
1733 case X86::BI__builtin_ia32_alignq256:
1734 case X86::BI__builtin_ia32_alignq512: {
1737 ops[2].getDefiningOp<cir::ConstantOp>().getIntValue().getZExtValue() &
1741 shiftVal &= numElts - 1;
1744 mlir::Type i32Ty = builder.getSInt32Ty();
1745 for (
unsigned i = 0; i != numElts; ++i)
1746 indices.push_back(cir::IntAttr::get(i32Ty, i + shiftVal));
1748 return builder.createVecShuffle(
getLoc(
expr->getExprLoc()), ops[0], ops[1],
1751 case X86::BI__builtin_ia32_shuf_f32x4_256:
1752 case X86::BI__builtin_ia32_shuf_f64x2_256:
1753 case X86::BI__builtin_ia32_shuf_i32x4_256:
1754 case X86::BI__builtin_ia32_shuf_i64x2_256:
1755 case X86::BI__builtin_ia32_shuf_f32x4:
1756 case X86::BI__builtin_ia32_shuf_f64x2:
1757 case X86::BI__builtin_ia32_shuf_i32x4:
1758 case X86::BI__builtin_ia32_shuf_i64x2: {
1759 mlir::Value src1 = ops[0];
1760 mlir::Value src2 = ops[1];
1763 ops[2].getDefiningOp<cir::ConstantOp>().getIntValue().getZExtValue();
1767 unsigned numLanes = totalBits == 512 ? 4 : 2;
1768 unsigned numElemsPerLane = numElems / numLanes;
1771 mlir::Type i32Ty = builder.getSInt32Ty();
1773 for (
unsigned l = 0; l != numElems; l += numElemsPerLane) {
1774 unsigned index = (imm % numLanes) * numElemsPerLane;
1776 if (l >= (numElems / 2))
1778 for (
unsigned i = 0; i != numElemsPerLane; ++i) {
1779 indices.push_back(cir::IntAttr::get(i32Ty,
index + i));
1783 return builder.createVecShuffle(
getLoc(
expr->getExprLoc()), src1, src2,
1786 case X86::BI__builtin_ia32_vperm2f128_pd256:
1787 case X86::BI__builtin_ia32_vperm2f128_ps256:
1788 case X86::BI__builtin_ia32_vperm2f128_si256:
1789 case X86::BI__builtin_ia32_permti256:
1790 case X86::BI__builtin_ia32_pslldqi128_byteshift:
1791 case X86::BI__builtin_ia32_pslldqi256_byteshift:
1792 case X86::BI__builtin_ia32_pslldqi512_byteshift:
1793 case X86::BI__builtin_ia32_psrldqi128_byteshift:
1794 case X86::BI__builtin_ia32_psrldqi256_byteshift:
1795 case X86::BI__builtin_ia32_psrldqi512_byteshift:
1796 cgm.errorNYI(
expr->getSourceRange(),
1797 std::string(
"unimplemented X86 builtin call: ") +
1798 getContext().BuiltinInfo.getName(builtinID));
1799 return mlir::Value{};
1800 case X86::BI__builtin_ia32_kshiftliqi:
1801 case X86::BI__builtin_ia32_kshiftlihi:
1802 case X86::BI__builtin_ia32_kshiftlisi:
1803 case X86::BI__builtin_ia32_kshiftlidi: {
1804 mlir::Location loc =
getLoc(
expr->getExprLoc());
1806 ops[1].getDefiningOp<cir::ConstantOp>().getIntValue().getZExtValue() &
1810 if (shiftVal >= numElems)
1811 return builder.getNullValue(ops[0].
getType(), loc);
1816 mlir::Type i32Ty = builder.getSInt32Ty();
1817 for (
auto i : llvm::seq<unsigned>(0, numElems))
1818 indices.push_back(cir::IntAttr::get(i32Ty, numElems + i - shiftVal));
1820 mlir::Value zero = builder.getNullValue(
in.getType(), loc);
1821 mlir::Value sv = builder.createVecShuffle(loc, zero,
in, indices);
1822 return builder.createBitcast(sv, ops[0].
getType());
1824 case X86::BI__builtin_ia32_kshiftriqi:
1825 case X86::BI__builtin_ia32_kshiftrihi:
1826 case X86::BI__builtin_ia32_kshiftrisi:
1827 case X86::BI__builtin_ia32_kshiftridi: {
1828 mlir::Location loc =
getLoc(
expr->getExprLoc());
1830 ops[1].getDefiningOp<cir::ConstantOp>().getIntValue().getZExtValue() &
1834 if (shiftVal >= numElems)
1835 return builder.getNullValue(ops[0].
getType(), loc);
1840 mlir::Type i32Ty = builder.getSInt32Ty();
1841 for (
auto i : llvm::seq<unsigned>(0, numElems))
1842 indices.push_back(cir::IntAttr::get(i32Ty, i + shiftVal));
1844 mlir::Value zero = builder.getNullValue(
in.getType(), loc);
1845 mlir::Value sv = builder.createVecShuffle(loc,
in, zero, indices);
1846 return builder.createBitcast(sv, ops[0].
getType());
1848 case X86::BI__builtin_ia32_vprotbi:
1849 case X86::BI__builtin_ia32_vprotwi:
1850 case X86::BI__builtin_ia32_vprotdi:
1851 case X86::BI__builtin_ia32_vprotqi:
1852 case X86::BI__builtin_ia32_prold128:
1853 case X86::BI__builtin_ia32_prold256:
1854 case X86::BI__builtin_ia32_prold512:
1855 case X86::BI__builtin_ia32_prolq128:
1856 case X86::BI__builtin_ia32_prolq256:
1857 case X86::BI__builtin_ia32_prolq512:
1859 ops[0], ops[1],
false);
1860 case X86::BI__builtin_ia32_prord128:
1861 case X86::BI__builtin_ia32_prord256:
1862 case X86::BI__builtin_ia32_prord512:
1863 case X86::BI__builtin_ia32_prorq128:
1864 case X86::BI__builtin_ia32_prorq256:
1865 case X86::BI__builtin_ia32_prorq512:
1867 ops[0], ops[1],
true);
1868 case X86::BI__builtin_ia32_selectb_128:
1869 case X86::BI__builtin_ia32_selectb_256:
1870 case X86::BI__builtin_ia32_selectb_512:
1871 case X86::BI__builtin_ia32_selectw_128:
1872 case X86::BI__builtin_ia32_selectw_256:
1873 case X86::BI__builtin_ia32_selectw_512:
1874 case X86::BI__builtin_ia32_selectd_128:
1875 case X86::BI__builtin_ia32_selectd_256:
1876 case X86::BI__builtin_ia32_selectd_512:
1877 case X86::BI__builtin_ia32_selectq_128:
1878 case X86::BI__builtin_ia32_selectq_256:
1879 case X86::BI__builtin_ia32_selectq_512:
1880 case X86::BI__builtin_ia32_selectph_128:
1881 case X86::BI__builtin_ia32_selectph_256:
1882 case X86::BI__builtin_ia32_selectph_512:
1883 case X86::BI__builtin_ia32_selectpbf_128:
1884 case X86::BI__builtin_ia32_selectpbf_256:
1885 case X86::BI__builtin_ia32_selectpbf_512:
1886 case X86::BI__builtin_ia32_selectps_128:
1887 case X86::BI__builtin_ia32_selectps_256:
1888 case X86::BI__builtin_ia32_selectps_512:
1889 case X86::BI__builtin_ia32_selectpd_128:
1890 case X86::BI__builtin_ia32_selectpd_256:
1891 case X86::BI__builtin_ia32_selectpd_512:
1894 case X86::BI__builtin_ia32_selectsh_128:
1895 case X86::BI__builtin_ia32_selectsbf_128:
1896 case X86::BI__builtin_ia32_selectss_128:
1897 case X86::BI__builtin_ia32_selectsd_128: {
1898 mlir::Location loc =
getLoc(
expr->getExprLoc());
1899 mlir::Value scalar1 =
1900 builder.createExtractElement(loc, ops[1], uint64_t(0));
1901 mlir::Value scalar2 =
1902 builder.createExtractElement(loc, ops[2], uint64_t(0));
1903 mlir::Value result =
1905 return builder.createInsertElement(loc, ops[1], result, uint64_t(0));
1907 case X86::BI__builtin_ia32_cmpb128_mask:
1908 case X86::BI__builtin_ia32_cmpb256_mask:
1909 case X86::BI__builtin_ia32_cmpb512_mask:
1910 case X86::BI__builtin_ia32_cmpw128_mask:
1911 case X86::BI__builtin_ia32_cmpw256_mask:
1912 case X86::BI__builtin_ia32_cmpw512_mask:
1913 case X86::BI__builtin_ia32_cmpd128_mask:
1914 case X86::BI__builtin_ia32_cmpd256_mask:
1915 case X86::BI__builtin_ia32_cmpd512_mask:
1916 case X86::BI__builtin_ia32_cmpq128_mask:
1917 case X86::BI__builtin_ia32_cmpq256_mask:
1918 case X86::BI__builtin_ia32_cmpq512_mask:
1919 case X86::BI__builtin_ia32_ucmpb128_mask:
1920 case X86::BI__builtin_ia32_ucmpb256_mask:
1921 case X86::BI__builtin_ia32_ucmpb512_mask:
1922 case X86::BI__builtin_ia32_ucmpw128_mask:
1923 case X86::BI__builtin_ia32_ucmpw256_mask:
1924 case X86::BI__builtin_ia32_ucmpw512_mask:
1925 case X86::BI__builtin_ia32_ucmpd128_mask:
1926 case X86::BI__builtin_ia32_ucmpd256_mask:
1927 case X86::BI__builtin_ia32_ucmpd512_mask:
1928 case X86::BI__builtin_ia32_ucmpq128_mask:
1929 case X86::BI__builtin_ia32_ucmpq256_mask:
1930 case X86::BI__builtin_ia32_ucmpq512_mask: {
1935 case X86::BI__builtin_ia32_vpcomb:
1936 case X86::BI__builtin_ia32_vpcomw:
1937 case X86::BI__builtin_ia32_vpcomd:
1938 case X86::BI__builtin_ia32_vpcomq:
1940 case X86::BI__builtin_ia32_vpcomub:
1941 case X86::BI__builtin_ia32_vpcomuw:
1942 case X86::BI__builtin_ia32_vpcomud:
1943 case X86::BI__builtin_ia32_vpcomuq:
1945 case X86::BI__builtin_ia32_kortestcqi:
1946 case X86::BI__builtin_ia32_kortestchi:
1947 case X86::BI__builtin_ia32_kortestcsi:
1948 case X86::BI__builtin_ia32_kortestcdi: {
1949 mlir::Location loc =
getLoc(
expr->getExprLoc());
1951 mlir::Value allOnesOp =
1952 builder.getConstAPInt(loc, ty, APInt::getAllOnes(ty.getWidth()));
1955 cir::CmpOp::create(builder, loc, cir::CmpOpKind::eq, orOp, allOnesOp);
1956 return builder.createCast(cir::CastKind::bool_to_int, cmp,
1957 cgm.convertType(
expr->getType()));
1959 case X86::BI__builtin_ia32_kortestzqi:
1960 case X86::BI__builtin_ia32_kortestzhi:
1961 case X86::BI__builtin_ia32_kortestzsi:
1962 case X86::BI__builtin_ia32_kortestzdi: {
1963 mlir::Location loc =
getLoc(
expr->getExprLoc());
1965 mlir::Value allZerosOp = builder.getNullValue(ty, loc).getResult();
1968 cir::CmpOp::create(builder, loc, cir::CmpOpKind::eq, orOp, allZerosOp);
1969 return builder.createCast(cir::CastKind::bool_to_int, cmp,
1970 cgm.convertType(
expr->getType()));
1972 case X86::BI__builtin_ia32_ktestcqi:
1974 "x86.avx512.ktestc.b", ops);
1975 case X86::BI__builtin_ia32_ktestzqi:
1977 "x86.avx512.ktestz.b", ops);
1978 case X86::BI__builtin_ia32_ktestchi:
1980 "x86.avx512.ktestc.w", ops);
1981 case X86::BI__builtin_ia32_ktestzhi:
1983 "x86.avx512.ktestz.w", ops);
1984 case X86::BI__builtin_ia32_ktestcsi:
1986 "x86.avx512.ktestc.d", ops);
1987 case X86::BI__builtin_ia32_ktestzsi:
1989 "x86.avx512.ktestz.d", ops);
1990 case X86::BI__builtin_ia32_ktestcdi:
1992 "x86.avx512.ktestc.q", ops);
1993 case X86::BI__builtin_ia32_ktestzdi:
1995 "x86.avx512.ktestz.q", ops);
1996 case X86::BI__builtin_ia32_kaddqi:
1998 "x86.avx512.kadd.b", ops);
1999 case X86::BI__builtin_ia32_kaddhi:
2001 "x86.avx512.kadd.w", ops);
2002 case X86::BI__builtin_ia32_kaddsi:
2004 "x86.avx512.kadd.d", ops);
2005 case X86::BI__builtin_ia32_kadddi:
2007 "x86.avx512.kadd.q", ops);
2008 case X86::BI__builtin_ia32_kandqi:
2009 case X86::BI__builtin_ia32_kandhi:
2010 case X86::BI__builtin_ia32_kandsi:
2011 case X86::BI__builtin_ia32_kanddi:
2014 case X86::BI__builtin_ia32_kandnqi:
2015 case X86::BI__builtin_ia32_kandnhi:
2016 case X86::BI__builtin_ia32_kandnsi:
2017 case X86::BI__builtin_ia32_kandndi:
2020 case X86::BI__builtin_ia32_korqi:
2021 case X86::BI__builtin_ia32_korhi:
2022 case X86::BI__builtin_ia32_korsi:
2023 case X86::BI__builtin_ia32_kordi:
2026 case X86::BI__builtin_ia32_kxnorqi:
2027 case X86::BI__builtin_ia32_kxnorhi:
2028 case X86::BI__builtin_ia32_kxnorsi:
2029 case X86::BI__builtin_ia32_kxnordi:
2032 case X86::BI__builtin_ia32_kxorqi:
2033 case X86::BI__builtin_ia32_kxorhi:
2034 case X86::BI__builtin_ia32_kxorsi:
2035 case X86::BI__builtin_ia32_kxordi:
2038 case X86::BI__builtin_ia32_knotqi:
2039 case X86::BI__builtin_ia32_knothi:
2040 case X86::BI__builtin_ia32_knotsi:
2041 case X86::BI__builtin_ia32_knotdi: {
2043 unsigned numElts = intTy.getWidth();
2044 mlir::Value resVec =
2046 return builder.createBitcast(builder.createNot(resVec), ops[0].getType());
2048 case X86::BI__builtin_ia32_kmovb:
2049 case X86::BI__builtin_ia32_kmovw:
2050 case X86::BI__builtin_ia32_kmovd:
2051 case X86::BI__builtin_ia32_kmovq: {
2056 unsigned numElts = intTy.getWidth();
2057 mlir::Value resVec =
2059 return builder.createBitcast(resVec, ops[0].
getType());
2061 case X86::BI__builtin_ia32_sqrtsh_round_mask:
2062 case X86::BI__builtin_ia32_sqrtsd_round_mask:
2063 case X86::BI__builtin_ia32_sqrtss_round_mask:
2064 cgm.errorNYI(
expr->getSourceRange(),
2065 std::string(
"unimplemented X86 builtin call: ") +
2066 getContext().BuiltinInfo.getName(builtinID));
2067 return mlir::Value{};
2068 case X86::BI__builtin_ia32_sqrtph512:
2069 case X86::BI__builtin_ia32_sqrtps512:
2070 case X86::BI__builtin_ia32_sqrtpd512: {
2071 mlir::Location loc =
getLoc(
expr->getExprLoc());
2072 mlir::Value arg = ops[0];
2073 return cir::SqrtOp::create(builder, loc, arg.getType(), arg).getResult();
2075 case X86::BI__builtin_ia32_pmuludq128:
2076 case X86::BI__builtin_ia32_pmuludq256:
2077 case X86::BI__builtin_ia32_pmuludq512: {
2078 unsigned opTypePrimitiveSizeInBits =
2079 cgm.getDataLayout().getTypeSizeInBits(ops[0].
getType());
2081 ops, opTypePrimitiveSizeInBits);
2083 case X86::BI__builtin_ia32_pmuldq128:
2084 case X86::BI__builtin_ia32_pmuldq256:
2085 case X86::BI__builtin_ia32_pmuldq512: {
2086 unsigned opTypePrimitiveSizeInBits =
2087 cgm.getDataLayout().getTypeSizeInBits(ops[0].
getType());
2089 ops, opTypePrimitiveSizeInBits);
2091 case X86::BI__builtin_ia32_pternlogd512_mask:
2092 case X86::BI__builtin_ia32_pternlogq512_mask:
2093 case X86::BI__builtin_ia32_pternlogd128_mask:
2094 case X86::BI__builtin_ia32_pternlogd256_mask:
2095 case X86::BI__builtin_ia32_pternlogq128_mask:
2096 case X86::BI__builtin_ia32_pternlogq256_mask:
2097 case X86::BI__builtin_ia32_pternlogd512_maskz:
2098 case X86::BI__builtin_ia32_pternlogq512_maskz:
2099 case X86::BI__builtin_ia32_pternlogd128_maskz:
2100 case X86::BI__builtin_ia32_pternlogd256_maskz:
2101 case X86::BI__builtin_ia32_pternlogq128_maskz:
2102 case X86::BI__builtin_ia32_pternlogq256_maskz:
2103 cgm.errorNYI(
expr->getSourceRange(),
2104 std::string(
"unimplemented X86 builtin call: ") +
2105 getContext().BuiltinInfo.getName(builtinID));
2106 return mlir::Value{};
2107 case X86::BI__builtin_ia32_vpshldd128:
2108 case X86::BI__builtin_ia32_vpshldd256:
2109 case X86::BI__builtin_ia32_vpshldd512:
2110 case X86::BI__builtin_ia32_vpshldq128:
2111 case X86::BI__builtin_ia32_vpshldq256:
2112 case X86::BI__builtin_ia32_vpshldq512:
2113 case X86::BI__builtin_ia32_vpshldw128:
2114 case X86::BI__builtin_ia32_vpshldw256:
2115 case X86::BI__builtin_ia32_vpshldw512:
2117 ops[1], ops[2],
false);
2118 case X86::BI__builtin_ia32_vpshrdd128:
2119 case X86::BI__builtin_ia32_vpshrdd256:
2120 case X86::BI__builtin_ia32_vpshrdd512:
2121 case X86::BI__builtin_ia32_vpshrdq128:
2122 case X86::BI__builtin_ia32_vpshrdq256:
2123 case X86::BI__builtin_ia32_vpshrdq512:
2124 case X86::BI__builtin_ia32_vpshrdw128:
2125 case X86::BI__builtin_ia32_vpshrdw256:
2126 case X86::BI__builtin_ia32_vpshrdw512:
2129 ops[0], ops[2],
true);
2130 case X86::BI__builtin_ia32_reduce_fadd_pd512:
2131 case X86::BI__builtin_ia32_reduce_fadd_ps512:
2132 case X86::BI__builtin_ia32_reduce_fadd_ph512:
2133 case X86::BI__builtin_ia32_reduce_fadd_ph256:
2134 case X86::BI__builtin_ia32_reduce_fadd_ph128: {
2136 return builder.emitIntrinsicCallOp(
getLoc(
expr->getExprLoc()),
2137 "vector.reduce.fadd", ops[0].getType(),
2138 mlir::ValueRange{ops[0], ops[1]});
2140 case X86::BI__builtin_ia32_reduce_fmul_pd512:
2141 case X86::BI__builtin_ia32_reduce_fmul_ps512:
2142 case X86::BI__builtin_ia32_reduce_fmul_ph512:
2143 case X86::BI__builtin_ia32_reduce_fmul_ph256:
2144 case X86::BI__builtin_ia32_reduce_fmul_ph128: {
2146 return builder.emitIntrinsicCallOp(
getLoc(
expr->getExprLoc()),
2147 "vector.reduce.fmul", ops[0].getType(),
2148 mlir::ValueRange{ops[0], ops[1]});
2150 case X86::BI__builtin_ia32_reduce_fmax_pd512:
2151 case X86::BI__builtin_ia32_reduce_fmax_ps512:
2152 case X86::BI__builtin_ia32_reduce_fmax_ph512:
2153 case X86::BI__builtin_ia32_reduce_fmax_ph256:
2154 case X86::BI__builtin_ia32_reduce_fmax_ph128: {
2157 return builder.emitIntrinsicCallOp(
2158 getLoc(
expr->getExprLoc()),
"vector.reduce.fmax",
2159 vecTy.getElementType(), mlir::ValueRange{ops[0]});
2161 case X86::BI__builtin_ia32_reduce_fmin_pd512:
2162 case X86::BI__builtin_ia32_reduce_fmin_ps512:
2163 case X86::BI__builtin_ia32_reduce_fmin_ph512:
2164 case X86::BI__builtin_ia32_reduce_fmin_ph256:
2165 case X86::BI__builtin_ia32_reduce_fmin_ph128: {
2168 return builder.emitIntrinsicCallOp(
2169 getLoc(
expr->getExprLoc()),
"vector.reduce.fmin",
2170 vecTy.getElementType(), mlir::ValueRange{ops[0]});
2172 case X86::BI__builtin_ia32_rdrand16_step:
2173 case X86::BI__builtin_ia32_rdrand32_step:
2174 case X86::BI__builtin_ia32_rdrand64_step:
2175 case X86::BI__builtin_ia32_rdseed16_step:
2176 case X86::BI__builtin_ia32_rdseed32_step:
2177 case X86::BI__builtin_ia32_rdseed64_step: {
2178 llvm::StringRef intrinsicName;
2179 switch (builtinID) {
2181 llvm_unreachable(
"Unsupported intrinsic!");
2182 case X86::BI__builtin_ia32_rdrand16_step:
2183 intrinsicName =
"x86.rdrand.16";
2185 case X86::BI__builtin_ia32_rdrand32_step:
2186 intrinsicName =
"x86.rdrand.32";
2188 case X86::BI__builtin_ia32_rdrand64_step:
2189 intrinsicName =
"x86.rdrand.64";
2191 case X86::BI__builtin_ia32_rdseed16_step:
2192 intrinsicName =
"x86.rdseed.16";
2194 case X86::BI__builtin_ia32_rdseed32_step:
2195 intrinsicName =
"x86.rdseed.32";
2197 case X86::BI__builtin_ia32_rdseed64_step:
2198 intrinsicName =
"x86.rdseed.64";
2202 mlir::Location loc =
getLoc(
expr->getExprLoc());
2205 builder.getUInt32Ty()};
2206 cir::RecordType resRecord =
2207 cir::RecordType::get(&
getMLIRContext(), resultTypes,
false,
false,
2208 cir::RecordType::RecordKind::Struct);
2211 builder.emitIntrinsicCallOp(loc, intrinsicName, resRecord);
2213 cir::ExtractMemberOp::create(builder, loc, randTy, call, 0);
2214 builder.CIRBaseBuilderTy::createStore(loc, rand, ops[0]);
2216 return cir::ExtractMemberOp::create(builder, loc, builder.getUInt32Ty(),
2219 case X86::BI__builtin_ia32_addcarryx_u32:
2220 case X86::BI__builtin_ia32_addcarryx_u64:
2221 case X86::BI__builtin_ia32_subborrow_u32:
2222 case X86::BI__builtin_ia32_subborrow_u64:
2223 cgm.errorNYI(
expr->getSourceRange(),
2224 std::string(
"unimplemented X86 builtin call: ") +
2225 getContext().BuiltinInfo.getName(builtinID));
2226 return mlir::Value{};
2227 case X86::BI__builtin_ia32_fpclassps128_mask:
2228 case X86::BI__builtin_ia32_fpclassps256_mask:
2229 case X86::BI__builtin_ia32_fpclassps512_mask:
2230 case X86::BI__builtin_ia32_vfpclassbf16128_mask:
2231 case X86::BI__builtin_ia32_vfpclassbf16256_mask:
2232 case X86::BI__builtin_ia32_vfpclassbf16512_mask:
2233 case X86::BI__builtin_ia32_fpclassph128_mask:
2234 case X86::BI__builtin_ia32_fpclassph256_mask:
2235 case X86::BI__builtin_ia32_fpclassph512_mask:
2236 case X86::BI__builtin_ia32_fpclasspd128_mask:
2237 case X86::BI__builtin_ia32_fpclasspd256_mask:
2238 case X86::BI__builtin_ia32_fpclasspd512_mask:
2240 case X86::BI__builtin_ia32_vp2intersect_q_512:
2241 case X86::BI__builtin_ia32_vp2intersect_q_256:
2242 case X86::BI__builtin_ia32_vp2intersect_q_128:
2243 case X86::BI__builtin_ia32_vp2intersect_d_512:
2244 case X86::BI__builtin_ia32_vp2intersect_d_256:
2245 case X86::BI__builtin_ia32_vp2intersect_d_128: {
2247 mlir::Location loc =
getLoc(
expr->getExprLoc());
2248 StringRef intrinsicName;
2250 switch (builtinID) {
2252 llvm_unreachable(
"Unexpected builtin");
2253 case X86::BI__builtin_ia32_vp2intersect_q_512:
2254 intrinsicName =
"x86.avx512.vp2intersect.q.512";
2256 case X86::BI__builtin_ia32_vp2intersect_q_256:
2257 intrinsicName =
"x86.avx512.vp2intersect.q.256";
2259 case X86::BI__builtin_ia32_vp2intersect_q_128:
2260 intrinsicName =
"x86.avx512.vp2intersect.q.128";
2262 case X86::BI__builtin_ia32_vp2intersect_d_512:
2263 intrinsicName =
"x86.avx512.vp2intersect.d.512";
2265 case X86::BI__builtin_ia32_vp2intersect_d_256:
2266 intrinsicName =
"x86.avx512.vp2intersect.d.256";
2268 case X86::BI__builtin_ia32_vp2intersect_d_128:
2269 intrinsicName =
"x86.avx512.vp2intersect.d.128";
2273 auto resVector = cir::VectorType::get(builder.getBoolTy(), numElts);
2275 cir::RecordType resRecord =
2276 cir::RecordType::get(&
getMLIRContext(), {resVector, resVector},
false,
2277 false, cir::RecordType::RecordKind::Struct);
2279 mlir::Value call = builder.emitIntrinsicCallOp(
2280 getLoc(
expr->getExprLoc()), intrinsicName, resRecord,
2281 mlir::ValueRange{ops[0], ops[1]});
2282 mlir::Value result =
2283 cir::ExtractMemberOp::create(builder, loc, resVector, call, 0);
2287 builder.createStore(loc, result, addr);
2289 result = cir::ExtractMemberOp::create(builder, loc, resVector, call, 1);
2293 builder.createStore(loc, result, addr);
2294 return mlir::Value{};
2296 case X86::BI__builtin_ia32_vpmultishiftqb128:
2297 case X86::BI__builtin_ia32_vpmultishiftqb256:
2298 case X86::BI__builtin_ia32_vpmultishiftqb512:
2299 case X86::BI__builtin_ia32_vpshufbitqmb128_mask:
2300 case X86::BI__builtin_ia32_vpshufbitqmb256_mask:
2301 case X86::BI__builtin_ia32_vpshufbitqmb512_mask:
2302 case X86::BI__builtin_ia32_cmpeqps:
2303 case X86::BI__builtin_ia32_cmpeqpd:
2304 case X86::BI__builtin_ia32_cmpltps:
2305 case X86::BI__builtin_ia32_cmpltpd:
2306 case X86::BI__builtin_ia32_cmpleps:
2307 case X86::BI__builtin_ia32_cmplepd:
2308 case X86::BI__builtin_ia32_cmpunordps:
2309 case X86::BI__builtin_ia32_cmpunordpd:
2310 case X86::BI__builtin_ia32_cmpneqps:
2311 case X86::BI__builtin_ia32_cmpneqpd:
2312 cgm.errorNYI(
expr->getSourceRange(),
2313 std::string(
"unimplemented X86 builtin call: ") +
2314 getContext().BuiltinInfo.getName(builtinID));
2315 return mlir::Value{};
2316 case X86::BI__builtin_ia32_cmpnltps:
2317 case X86::BI__builtin_ia32_cmpnltpd:
2320 case X86::BI__builtin_ia32_cmpnleps:
2321 case X86::BI__builtin_ia32_cmpnlepd:
2324 case X86::BI__builtin_ia32_cmpordps:
2325 case X86::BI__builtin_ia32_cmpordpd:
2326 case X86::BI__builtin_ia32_cmpph128_mask:
2327 case X86::BI__builtin_ia32_cmpph256_mask:
2328 case X86::BI__builtin_ia32_cmpph512_mask:
2329 case X86::BI__builtin_ia32_cmpps128_mask:
2330 case X86::BI__builtin_ia32_cmpps256_mask:
2331 case X86::BI__builtin_ia32_cmpps512_mask:
2332 case X86::BI__builtin_ia32_cmppd128_mask:
2333 case X86::BI__builtin_ia32_cmppd256_mask:
2334 case X86::BI__builtin_ia32_cmppd512_mask:
2335 case X86::BI__builtin_ia32_vcmpbf16512_mask:
2336 case X86::BI__builtin_ia32_vcmpbf16256_mask:
2337 case X86::BI__builtin_ia32_vcmpbf16128_mask:
2338 case X86::BI__builtin_ia32_cmpps:
2339 case X86::BI__builtin_ia32_cmpps256:
2340 case X86::BI__builtin_ia32_cmppd:
2341 case X86::BI__builtin_ia32_cmppd256:
2342 case X86::BI__builtin_ia32_cmpeqss:
2343 case X86::BI__builtin_ia32_cmpltss:
2344 case X86::BI__builtin_ia32_cmpless:
2345 case X86::BI__builtin_ia32_cmpunordss:
2346 case X86::BI__builtin_ia32_cmpneqss:
2347 case X86::BI__builtin_ia32_cmpnltss:
2348 case X86::BI__builtin_ia32_cmpnless:
2349 case X86::BI__builtin_ia32_cmpordss:
2350 case X86::BI__builtin_ia32_cmpeqsd:
2351 case X86::BI__builtin_ia32_cmpltsd:
2352 case X86::BI__builtin_ia32_cmplesd:
2353 case X86::BI__builtin_ia32_cmpunordsd:
2354 case X86::BI__builtin_ia32_cmpneqsd:
2355 case X86::BI__builtin_ia32_cmpnltsd:
2356 case X86::BI__builtin_ia32_cmpnlesd:
2357 case X86::BI__builtin_ia32_cmpordsd:
2358 cgm.errorNYI(
expr->getSourceRange(),
2359 std::string(
"unimplemented X86 builtin call: ") +
2360 getContext().BuiltinInfo.getName(builtinID));
2362 case X86::BI__builtin_ia32_vcvtph2ps_mask:
2363 case X86::BI__builtin_ia32_vcvtph2ps256_mask:
2364 case X86::BI__builtin_ia32_vcvtph2ps512_mask: {
2365 mlir::Location loc =
getLoc(
expr->getExprLoc());
2369 case X86::BI__builtin_ia32_cvtneps2bf16_128_mask: {
2370 mlir::Location loc =
getLoc(
expr->getExprLoc());
2374 unsigned numElts = inputTy.getSize();
2379 args.push_back(ops[0]);
2380 args.push_back(ops[1]);
2381 args.push_back(mask);
2383 return builder.emitIntrinsicCallOp(
2384 loc,
"x86.avx512bf16.mask.cvtneps2bf16.128", resTy, args);
2386 case X86::BI__builtin_ia32_cvtneps2bf16_256_mask:
2387 case X86::BI__builtin_ia32_cvtneps2bf16_512_mask: {
2388 mlir::Location loc =
getLoc(
expr->getExprLoc());
2390 StringRef intrinsicName;
2391 if (builtinID == X86::BI__builtin_ia32_cvtneps2bf16_256_mask) {
2392 intrinsicName =
"x86.avx512bf16.cvtneps2bf16.256";
2394 assert(builtinID == X86::BI__builtin_ia32_cvtneps2bf16_512_mask);
2395 intrinsicName =
"x86.avx512bf16.cvtneps2bf16.512";
2398 mlir::Value res = builder.emitIntrinsicCallOp(loc, intrinsicName, resTy,
2399 mlir::ValueRange{ops[0]});
2403 case X86::BI__cpuid:
2404 case X86::BI__cpuidex: {
2405 mlir::Location loc =
getLoc(
expr->getExprLoc());
2406 mlir::Value subFuncId = builtinID == X86::BI__cpuidex
2408 : builder.getConstInt(loc,
sInt32Ty, 0);
2409 cir::CpuIdOp::create(builder, loc, ops[0],
2411 return mlir::Value{};
2414 case X86::BI__emulu:
2416 case X86::BI__umulh:
2417 case X86::BI_mul128:
2418 case X86::BI_umul128: {
2419 cgm.errorNYI(
expr->getSourceRange(),
2420 std::string(
"unimplemented X86 builtin call: ") +
2421 getContext().BuiltinInfo.getName(builtinID));
2422 return mlir::Value{};
2424 case X86::BI__faststorefence: {
2425 cir::AtomicFenceOp::create(
2427 cir::MemOrder::SequentiallyConsistent,
2429 cir::SyncScopeKind::System));
2430 return mlir::Value{};
2432 case X86::BI__shiftleft128:
2433 case X86::BI__shiftright128: {
2437 std::swap(ops[0], ops[1]);
2440 auto amtTy = mlir::cast<cir::IntType>(ops[2].
getType());
2441 cir::IntType i64Ty = builder.getUInt64Ty();
2444 ops[2] = builder.createIntCast(ops[2], i64Ty);
2446 const StringRef intrinsicName =
2447 (builtinID == X86::BI__shiftleft128) ?
"fshl" :
"fshr";
2448 return builder.emitIntrinsicCallOp(
2449 getLoc(
expr->getExprLoc()), intrinsicName, i64Ty,
2450 mlir::ValueRange{ops[0], ops[1], ops[2]});
2452 case X86::BI_ReadWriteBarrier:
2453 case X86::BI_ReadBarrier:
2454 case X86::BI_WriteBarrier: {
2455 cir::AtomicFenceOp::create(
2457 cir::MemOrder::SequentiallyConsistent,
2459 cir::SyncScopeKind::SingleThread));
2460 return mlir::Value{};
2462 case X86::BI_AddressOfReturnAddress: {
2463 mlir::Location loc =
getLoc(
expr->getExprLoc());
2466 return builder.createCast(loc, cir::CastKind::bitcast, addr,
voidPtrTy);
2468 case X86::BI__stosb:
2470 case X86::BI__int2c:
2471 case X86::BI__readfsbyte:
2472 case X86::BI__readfsword:
2473 case X86::BI__readfsdword:
2474 case X86::BI__readfsqword:
2475 case X86::BI__readgsbyte:
2476 case X86::BI__readgsword:
2477 case X86::BI__readgsdword:
2478 case X86::BI__readgsqword: {
2479 cgm.errorNYI(
expr->getSourceRange(),
2480 std::string(
"unimplemented X86 builtin call: ") +
2481 getContext().BuiltinInfo.getName(builtinID));
2482 return mlir::Value{};
2484 case X86::BI__builtin_ia32_encodekey128_u32: {
2486 {ops[0], ops[1]}, ops[2], 6,
"x86.encodekey128", 3);
2488 case X86::BI__builtin_ia32_encodekey256_u32: {
2491 {ops[0], ops[1], ops[2]}, ops[3], 7,
2492 "x86.encodekey256", 4);
2495 case X86::BI__builtin_ia32_aesenc128kl_u8:
2496 case X86::BI__builtin_ia32_aesdec128kl_u8:
2497 case X86::BI__builtin_ia32_aesenc256kl_u8:
2498 case X86::BI__builtin_ia32_aesdec256kl_u8: {
2499 llvm::StringRef intrinsicName;
2500 switch (builtinID) {
2502 llvm_unreachable(
"Unexpected builtin");
2503 case X86::BI__builtin_ia32_aesenc128kl_u8:
2504 intrinsicName =
"x86.aesenc128kl";
2506 case X86::BI__builtin_ia32_aesdec128kl_u8:
2507 intrinsicName =
"x86.aesdec128kl";
2509 case X86::BI__builtin_ia32_aesenc256kl_u8:
2510 intrinsicName =
"x86.aesenc256kl";
2512 case X86::BI__builtin_ia32_aesdec256kl_u8:
2513 intrinsicName =
"x86.aesdec256kl";
2520 case X86::BI__builtin_ia32_aesencwide128kl_u8:
2521 case X86::BI__builtin_ia32_aesdecwide128kl_u8:
2522 case X86::BI__builtin_ia32_aesencwide256kl_u8:
2523 case X86::BI__builtin_ia32_aesdecwide256kl_u8: {
2524 llvm::StringRef intrinsicName;
2525 switch (builtinID) {
2527 llvm_unreachable(
"Unexpected builtin");
2528 case X86::BI__builtin_ia32_aesencwide128kl_u8:
2529 intrinsicName =
"x86.aesencwide128kl";
2531 case X86::BI__builtin_ia32_aesdecwide128kl_u8:
2532 intrinsicName =
"x86.aesdecwide128kl";
2534 case X86::BI__builtin_ia32_aesencwide256kl_u8:
2535 intrinsicName =
"x86.aesencwide256kl";
2537 case X86::BI__builtin_ia32_aesdecwide256kl_u8:
2538 intrinsicName =
"x86.aesdecwide256kl";
2545 case X86::BI__builtin_ia32_vfcmaddcph512_mask:
2546 case X86::BI__builtin_ia32_vfmaddcph512_mask:
2547 case X86::BI__builtin_ia32_vfcmaddcsh_round_mask:
2548 case X86::BI__builtin_ia32_vfmaddcsh_round_mask:
2549 case X86::BI__builtin_ia32_vfcmaddcsh_round_mask3:
2550 case X86::BI__builtin_ia32_vfmaddcsh_round_mask3:
2551 case X86::BI__builtin_ia32_prefetchi:
2552 cgm.errorNYI(
expr->getSourceRange(),
2553 std::string(
"unimplemented X86 builtin call: ") +
2554 getContext().BuiltinInfo.getName(builtinID));
2555 return mlir::Value{};